##// END OF EJS Templates
util: add `nb_bytes` argument to `copyfile` to partially copy a file...
marmoute -
r48192:9b841267 default
parent child Browse files
Show More
@@ -1,3380 +1,3394
1 # util.py - Mercurial utility functions and platform specific implementations
1 # util.py - Mercurial utility functions and platform specific implementations
2 #
2 #
3 # Copyright 2005 K. Thananchayan <thananck@yahoo.com>
3 # Copyright 2005 K. Thananchayan <thananck@yahoo.com>
4 # Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
4 # Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
5 # Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
5 # Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
6 #
6 #
7 # This software may be used and distributed according to the terms of the
7 # This software may be used and distributed according to the terms of the
8 # GNU General Public License version 2 or any later version.
8 # GNU General Public License version 2 or any later version.
9
9
10 """Mercurial utility functions and platform specific implementations.
10 """Mercurial utility functions and platform specific implementations.
11
11
12 This contains helper routines that are independent of the SCM core and
12 This contains helper routines that are independent of the SCM core and
13 hide platform-specific details from the core.
13 hide platform-specific details from the core.
14 """
14 """
15
15
16 from __future__ import absolute_import, print_function
16 from __future__ import absolute_import, print_function
17
17
18 import abc
18 import abc
19 import collections
19 import collections
20 import contextlib
20 import contextlib
21 import errno
21 import errno
22 import gc
22 import gc
23 import hashlib
23 import hashlib
24 import itertools
24 import itertools
25 import locale
25 import locale
26 import mmap
26 import mmap
27 import os
27 import os
28 import platform as pyplatform
28 import platform as pyplatform
29 import re as remod
29 import re as remod
30 import shutil
30 import shutil
31 import stat
31 import stat
32 import sys
32 import sys
33 import time
33 import time
34 import traceback
34 import traceback
35 import warnings
35 import warnings
36
36
37 from .node import hex
37 from .node import hex
38 from .thirdparty import attr
38 from .thirdparty import attr
39 from .pycompat import (
39 from .pycompat import (
40 delattr,
40 delattr,
41 getattr,
41 getattr,
42 open,
42 open,
43 setattr,
43 setattr,
44 )
44 )
45 from .node import hex
45 from .node import hex
46 from hgdemandimport import tracing
46 from hgdemandimport import tracing
47 from . import (
47 from . import (
48 encoding,
48 encoding,
49 error,
49 error,
50 i18n,
50 i18n,
51 policy,
51 policy,
52 pycompat,
52 pycompat,
53 urllibcompat,
53 urllibcompat,
54 )
54 )
55 from .utils import (
55 from .utils import (
56 compression,
56 compression,
57 hashutil,
57 hashutil,
58 procutil,
58 procutil,
59 stringutil,
59 stringutil,
60 urlutil,
60 urlutil,
61 )
61 )
62
62
63 if pycompat.TYPE_CHECKING:
63 if pycompat.TYPE_CHECKING:
64 from typing import (
64 from typing import (
65 Iterator,
65 Iterator,
66 List,
66 List,
67 Optional,
67 Optional,
68 Tuple,
68 Tuple,
69 )
69 )
70
70
71
71
72 base85 = policy.importmod('base85')
72 base85 = policy.importmod('base85')
73 osutil = policy.importmod('osutil')
73 osutil = policy.importmod('osutil')
74
74
75 b85decode = base85.b85decode
75 b85decode = base85.b85decode
76 b85encode = base85.b85encode
76 b85encode = base85.b85encode
77
77
78 cookielib = pycompat.cookielib
78 cookielib = pycompat.cookielib
79 httplib = pycompat.httplib
79 httplib = pycompat.httplib
80 pickle = pycompat.pickle
80 pickle = pycompat.pickle
81 safehasattr = pycompat.safehasattr
81 safehasattr = pycompat.safehasattr
82 socketserver = pycompat.socketserver
82 socketserver = pycompat.socketserver
83 bytesio = pycompat.bytesio
83 bytesio = pycompat.bytesio
84 # TODO deprecate stringio name, as it is a lie on Python 3.
84 # TODO deprecate stringio name, as it is a lie on Python 3.
85 stringio = bytesio
85 stringio = bytesio
86 xmlrpclib = pycompat.xmlrpclib
86 xmlrpclib = pycompat.xmlrpclib
87
87
88 httpserver = urllibcompat.httpserver
88 httpserver = urllibcompat.httpserver
89 urlerr = urllibcompat.urlerr
89 urlerr = urllibcompat.urlerr
90 urlreq = urllibcompat.urlreq
90 urlreq = urllibcompat.urlreq
91
91
92 # workaround for win32mbcs
92 # workaround for win32mbcs
93 _filenamebytestr = pycompat.bytestr
93 _filenamebytestr = pycompat.bytestr
94
94
95 if pycompat.iswindows:
95 if pycompat.iswindows:
96 from . import windows as platform
96 from . import windows as platform
97 else:
97 else:
98 from . import posix as platform
98 from . import posix as platform
99
99
100 _ = i18n._
100 _ = i18n._
101
101
102 bindunixsocket = platform.bindunixsocket
102 bindunixsocket = platform.bindunixsocket
103 cachestat = platform.cachestat
103 cachestat = platform.cachestat
104 checkexec = platform.checkexec
104 checkexec = platform.checkexec
105 checklink = platform.checklink
105 checklink = platform.checklink
106 copymode = platform.copymode
106 copymode = platform.copymode
107 expandglobs = platform.expandglobs
107 expandglobs = platform.expandglobs
108 getfsmountpoint = platform.getfsmountpoint
108 getfsmountpoint = platform.getfsmountpoint
109 getfstype = platform.getfstype
109 getfstype = platform.getfstype
110 get_password = platform.get_password
110 get_password = platform.get_password
111 groupmembers = platform.groupmembers
111 groupmembers = platform.groupmembers
112 groupname = platform.groupname
112 groupname = platform.groupname
113 isexec = platform.isexec
113 isexec = platform.isexec
114 isowner = platform.isowner
114 isowner = platform.isowner
115 listdir = osutil.listdir
115 listdir = osutil.listdir
116 localpath = platform.localpath
116 localpath = platform.localpath
117 lookupreg = platform.lookupreg
117 lookupreg = platform.lookupreg
118 makedir = platform.makedir
118 makedir = platform.makedir
119 nlinks = platform.nlinks
119 nlinks = platform.nlinks
120 normpath = platform.normpath
120 normpath = platform.normpath
121 normcase = platform.normcase
121 normcase = platform.normcase
122 normcasespec = platform.normcasespec
122 normcasespec = platform.normcasespec
123 normcasefallback = platform.normcasefallback
123 normcasefallback = platform.normcasefallback
124 openhardlinks = platform.openhardlinks
124 openhardlinks = platform.openhardlinks
125 oslink = platform.oslink
125 oslink = platform.oslink
126 parsepatchoutput = platform.parsepatchoutput
126 parsepatchoutput = platform.parsepatchoutput
127 pconvert = platform.pconvert
127 pconvert = platform.pconvert
128 poll = platform.poll
128 poll = platform.poll
129 posixfile = platform.posixfile
129 posixfile = platform.posixfile
130 readlink = platform.readlink
130 readlink = platform.readlink
131 rename = platform.rename
131 rename = platform.rename
132 removedirs = platform.removedirs
132 removedirs = platform.removedirs
133 samedevice = platform.samedevice
133 samedevice = platform.samedevice
134 samefile = platform.samefile
134 samefile = platform.samefile
135 samestat = platform.samestat
135 samestat = platform.samestat
136 setflags = platform.setflags
136 setflags = platform.setflags
137 split = platform.split
137 split = platform.split
138 statfiles = getattr(osutil, 'statfiles', platform.statfiles)
138 statfiles = getattr(osutil, 'statfiles', platform.statfiles)
139 statisexec = platform.statisexec
139 statisexec = platform.statisexec
140 statislink = platform.statislink
140 statislink = platform.statislink
141 umask = platform.umask
141 umask = platform.umask
142 unlink = platform.unlink
142 unlink = platform.unlink
143 username = platform.username
143 username = platform.username
144
144
145
145
146 def setumask(val):
146 def setumask(val):
147 # type: (int) -> None
147 # type: (int) -> None
148 '''updates the umask. used by chg server'''
148 '''updates the umask. used by chg server'''
149 if pycompat.iswindows:
149 if pycompat.iswindows:
150 return
150 return
151 os.umask(val)
151 os.umask(val)
152 global umask
152 global umask
153 platform.umask = umask = val & 0o777
153 platform.umask = umask = val & 0o777
154
154
155
155
156 # small compat layer
156 # small compat layer
157 compengines = compression.compengines
157 compengines = compression.compengines
158 SERVERROLE = compression.SERVERROLE
158 SERVERROLE = compression.SERVERROLE
159 CLIENTROLE = compression.CLIENTROLE
159 CLIENTROLE = compression.CLIENTROLE
160
160
161 try:
161 try:
162 recvfds = osutil.recvfds
162 recvfds = osutil.recvfds
163 except AttributeError:
163 except AttributeError:
164 pass
164 pass
165
165
166 # Python compatibility
166 # Python compatibility
167
167
168 _notset = object()
168 _notset = object()
169
169
170
170
171 def bitsfrom(container):
171 def bitsfrom(container):
172 bits = 0
172 bits = 0
173 for bit in container:
173 for bit in container:
174 bits |= bit
174 bits |= bit
175 return bits
175 return bits
176
176
177
177
178 # python 2.6 still have deprecation warning enabled by default. We do not want
178 # python 2.6 still have deprecation warning enabled by default. We do not want
179 # to display anything to standard user so detect if we are running test and
179 # to display anything to standard user so detect if we are running test and
180 # only use python deprecation warning in this case.
180 # only use python deprecation warning in this case.
181 _dowarn = bool(encoding.environ.get(b'HGEMITWARNINGS'))
181 _dowarn = bool(encoding.environ.get(b'HGEMITWARNINGS'))
182 if _dowarn:
182 if _dowarn:
183 # explicitly unfilter our warning for python 2.7
183 # explicitly unfilter our warning for python 2.7
184 #
184 #
185 # The option of setting PYTHONWARNINGS in the test runner was investigated.
185 # The option of setting PYTHONWARNINGS in the test runner was investigated.
186 # However, module name set through PYTHONWARNINGS was exactly matched, so
186 # However, module name set through PYTHONWARNINGS was exactly matched, so
187 # we cannot set 'mercurial' and have it match eg: 'mercurial.scmutil'. This
187 # we cannot set 'mercurial' and have it match eg: 'mercurial.scmutil'. This
188 # makes the whole PYTHONWARNINGS thing useless for our usecase.
188 # makes the whole PYTHONWARNINGS thing useless for our usecase.
189 warnings.filterwarnings('default', '', DeprecationWarning, 'mercurial')
189 warnings.filterwarnings('default', '', DeprecationWarning, 'mercurial')
190 warnings.filterwarnings('default', '', DeprecationWarning, 'hgext')
190 warnings.filterwarnings('default', '', DeprecationWarning, 'hgext')
191 warnings.filterwarnings('default', '', DeprecationWarning, 'hgext3rd')
191 warnings.filterwarnings('default', '', DeprecationWarning, 'hgext3rd')
192 if _dowarn and pycompat.ispy3:
192 if _dowarn and pycompat.ispy3:
193 # silence warning emitted by passing user string to re.sub()
193 # silence warning emitted by passing user string to re.sub()
194 warnings.filterwarnings(
194 warnings.filterwarnings(
195 'ignore', 'bad escape', DeprecationWarning, 'mercurial'
195 'ignore', 'bad escape', DeprecationWarning, 'mercurial'
196 )
196 )
197 warnings.filterwarnings(
197 warnings.filterwarnings(
198 'ignore', 'invalid escape sequence', DeprecationWarning, 'mercurial'
198 'ignore', 'invalid escape sequence', DeprecationWarning, 'mercurial'
199 )
199 )
200 # TODO: reinvent imp.is_frozen()
200 # TODO: reinvent imp.is_frozen()
201 warnings.filterwarnings(
201 warnings.filterwarnings(
202 'ignore',
202 'ignore',
203 'the imp module is deprecated',
203 'the imp module is deprecated',
204 DeprecationWarning,
204 DeprecationWarning,
205 'mercurial',
205 'mercurial',
206 )
206 )
207
207
208
208
209 def nouideprecwarn(msg, version, stacklevel=1):
209 def nouideprecwarn(msg, version, stacklevel=1):
210 """Issue an python native deprecation warning
210 """Issue an python native deprecation warning
211
211
212 This is a noop outside of tests, use 'ui.deprecwarn' when possible.
212 This is a noop outside of tests, use 'ui.deprecwarn' when possible.
213 """
213 """
214 if _dowarn:
214 if _dowarn:
215 msg += (
215 msg += (
216 b"\n(compatibility will be dropped after Mercurial-%s,"
216 b"\n(compatibility will be dropped after Mercurial-%s,"
217 b" update your code.)"
217 b" update your code.)"
218 ) % version
218 ) % version
219 warnings.warn(pycompat.sysstr(msg), DeprecationWarning, stacklevel + 1)
219 warnings.warn(pycompat.sysstr(msg), DeprecationWarning, stacklevel + 1)
220 # on python 3 with chg, we will need to explicitly flush the output
220 # on python 3 with chg, we will need to explicitly flush the output
221 sys.stderr.flush()
221 sys.stderr.flush()
222
222
223
223
224 DIGESTS = {
224 DIGESTS = {
225 b'md5': hashlib.md5,
225 b'md5': hashlib.md5,
226 b'sha1': hashutil.sha1,
226 b'sha1': hashutil.sha1,
227 b'sha512': hashlib.sha512,
227 b'sha512': hashlib.sha512,
228 }
228 }
229 # List of digest types from strongest to weakest
229 # List of digest types from strongest to weakest
230 DIGESTS_BY_STRENGTH = [b'sha512', b'sha1', b'md5']
230 DIGESTS_BY_STRENGTH = [b'sha512', b'sha1', b'md5']
231
231
232 for k in DIGESTS_BY_STRENGTH:
232 for k in DIGESTS_BY_STRENGTH:
233 assert k in DIGESTS
233 assert k in DIGESTS
234
234
235
235
236 class digester(object):
236 class digester(object):
237 """helper to compute digests.
237 """helper to compute digests.
238
238
239 This helper can be used to compute one or more digests given their name.
239 This helper can be used to compute one or more digests given their name.
240
240
241 >>> d = digester([b'md5', b'sha1'])
241 >>> d = digester([b'md5', b'sha1'])
242 >>> d.update(b'foo')
242 >>> d.update(b'foo')
243 >>> [k for k in sorted(d)]
243 >>> [k for k in sorted(d)]
244 ['md5', 'sha1']
244 ['md5', 'sha1']
245 >>> d[b'md5']
245 >>> d[b'md5']
246 'acbd18db4cc2f85cedef654fccc4a4d8'
246 'acbd18db4cc2f85cedef654fccc4a4d8'
247 >>> d[b'sha1']
247 >>> d[b'sha1']
248 '0beec7b5ea3f0fdbc95d0dd47f3c5bc275da8a33'
248 '0beec7b5ea3f0fdbc95d0dd47f3c5bc275da8a33'
249 >>> digester.preferred([b'md5', b'sha1'])
249 >>> digester.preferred([b'md5', b'sha1'])
250 'sha1'
250 'sha1'
251 """
251 """
252
252
253 def __init__(self, digests, s=b''):
253 def __init__(self, digests, s=b''):
254 self._hashes = {}
254 self._hashes = {}
255 for k in digests:
255 for k in digests:
256 if k not in DIGESTS:
256 if k not in DIGESTS:
257 raise error.Abort(_(b'unknown digest type: %s') % k)
257 raise error.Abort(_(b'unknown digest type: %s') % k)
258 self._hashes[k] = DIGESTS[k]()
258 self._hashes[k] = DIGESTS[k]()
259 if s:
259 if s:
260 self.update(s)
260 self.update(s)
261
261
262 def update(self, data):
262 def update(self, data):
263 for h in self._hashes.values():
263 for h in self._hashes.values():
264 h.update(data)
264 h.update(data)
265
265
266 def __getitem__(self, key):
266 def __getitem__(self, key):
267 if key not in DIGESTS:
267 if key not in DIGESTS:
268 raise error.Abort(_(b'unknown digest type: %s') % k)
268 raise error.Abort(_(b'unknown digest type: %s') % k)
269 return hex(self._hashes[key].digest())
269 return hex(self._hashes[key].digest())
270
270
271 def __iter__(self):
271 def __iter__(self):
272 return iter(self._hashes)
272 return iter(self._hashes)
273
273
274 @staticmethod
274 @staticmethod
275 def preferred(supported):
275 def preferred(supported):
276 """returns the strongest digest type in both supported and DIGESTS."""
276 """returns the strongest digest type in both supported and DIGESTS."""
277
277
278 for k in DIGESTS_BY_STRENGTH:
278 for k in DIGESTS_BY_STRENGTH:
279 if k in supported:
279 if k in supported:
280 return k
280 return k
281 return None
281 return None
282
282
283
283
284 class digestchecker(object):
284 class digestchecker(object):
285 """file handle wrapper that additionally checks content against a given
285 """file handle wrapper that additionally checks content against a given
286 size and digests.
286 size and digests.
287
287
288 d = digestchecker(fh, size, {'md5': '...'})
288 d = digestchecker(fh, size, {'md5': '...'})
289
289
290 When multiple digests are given, all of them are validated.
290 When multiple digests are given, all of them are validated.
291 """
291 """
292
292
293 def __init__(self, fh, size, digests):
293 def __init__(self, fh, size, digests):
294 self._fh = fh
294 self._fh = fh
295 self._size = size
295 self._size = size
296 self._got = 0
296 self._got = 0
297 self._digests = dict(digests)
297 self._digests = dict(digests)
298 self._digester = digester(self._digests.keys())
298 self._digester = digester(self._digests.keys())
299
299
300 def read(self, length=-1):
300 def read(self, length=-1):
301 content = self._fh.read(length)
301 content = self._fh.read(length)
302 self._digester.update(content)
302 self._digester.update(content)
303 self._got += len(content)
303 self._got += len(content)
304 return content
304 return content
305
305
306 def validate(self):
306 def validate(self):
307 if self._size != self._got:
307 if self._size != self._got:
308 raise error.Abort(
308 raise error.Abort(
309 _(b'size mismatch: expected %d, got %d')
309 _(b'size mismatch: expected %d, got %d')
310 % (self._size, self._got)
310 % (self._size, self._got)
311 )
311 )
312 for k, v in self._digests.items():
312 for k, v in self._digests.items():
313 if v != self._digester[k]:
313 if v != self._digester[k]:
314 # i18n: first parameter is a digest name
314 # i18n: first parameter is a digest name
315 raise error.Abort(
315 raise error.Abort(
316 _(b'%s mismatch: expected %s, got %s')
316 _(b'%s mismatch: expected %s, got %s')
317 % (k, v, self._digester[k])
317 % (k, v, self._digester[k])
318 )
318 )
319
319
320
320
321 try:
321 try:
322 buffer = buffer # pytype: disable=name-error
322 buffer = buffer # pytype: disable=name-error
323 except NameError:
323 except NameError:
324
324
325 def buffer(sliceable, offset=0, length=None):
325 def buffer(sliceable, offset=0, length=None):
326 if length is not None:
326 if length is not None:
327 return memoryview(sliceable)[offset : offset + length]
327 return memoryview(sliceable)[offset : offset + length]
328 return memoryview(sliceable)[offset:]
328 return memoryview(sliceable)[offset:]
329
329
330
330
331 _chunksize = 4096
331 _chunksize = 4096
332
332
333
333
334 class bufferedinputpipe(object):
334 class bufferedinputpipe(object):
335 """a manually buffered input pipe
335 """a manually buffered input pipe
336
336
337 Python will not let us use buffered IO and lazy reading with 'polling' at
337 Python will not let us use buffered IO and lazy reading with 'polling' at
338 the same time. We cannot probe the buffer state and select will not detect
338 the same time. We cannot probe the buffer state and select will not detect
339 that data are ready to read if they are already buffered.
339 that data are ready to read if they are already buffered.
340
340
341 This class let us work around that by implementing its own buffering
341 This class let us work around that by implementing its own buffering
342 (allowing efficient readline) while offering a way to know if the buffer is
342 (allowing efficient readline) while offering a way to know if the buffer is
343 empty from the output (allowing collaboration of the buffer with polling).
343 empty from the output (allowing collaboration of the buffer with polling).
344
344
345 This class lives in the 'util' module because it makes use of the 'os'
345 This class lives in the 'util' module because it makes use of the 'os'
346 module from the python stdlib.
346 module from the python stdlib.
347 """
347 """
348
348
349 def __new__(cls, fh):
349 def __new__(cls, fh):
350 # If we receive a fileobjectproxy, we need to use a variation of this
350 # If we receive a fileobjectproxy, we need to use a variation of this
351 # class that notifies observers about activity.
351 # class that notifies observers about activity.
352 if isinstance(fh, fileobjectproxy):
352 if isinstance(fh, fileobjectproxy):
353 cls = observedbufferedinputpipe
353 cls = observedbufferedinputpipe
354
354
355 return super(bufferedinputpipe, cls).__new__(cls)
355 return super(bufferedinputpipe, cls).__new__(cls)
356
356
357 def __init__(self, input):
357 def __init__(self, input):
358 self._input = input
358 self._input = input
359 self._buffer = []
359 self._buffer = []
360 self._eof = False
360 self._eof = False
361 self._lenbuf = 0
361 self._lenbuf = 0
362
362
363 @property
363 @property
364 def hasbuffer(self):
364 def hasbuffer(self):
365 """True is any data is currently buffered
365 """True is any data is currently buffered
366
366
367 This will be used externally a pre-step for polling IO. If there is
367 This will be used externally a pre-step for polling IO. If there is
368 already data then no polling should be set in place."""
368 already data then no polling should be set in place."""
369 return bool(self._buffer)
369 return bool(self._buffer)
370
370
371 @property
371 @property
372 def closed(self):
372 def closed(self):
373 return self._input.closed
373 return self._input.closed
374
374
375 def fileno(self):
375 def fileno(self):
376 return self._input.fileno()
376 return self._input.fileno()
377
377
378 def close(self):
378 def close(self):
379 return self._input.close()
379 return self._input.close()
380
380
381 def read(self, size):
381 def read(self, size):
382 while (not self._eof) and (self._lenbuf < size):
382 while (not self._eof) and (self._lenbuf < size):
383 self._fillbuffer()
383 self._fillbuffer()
384 return self._frombuffer(size)
384 return self._frombuffer(size)
385
385
386 def unbufferedread(self, size):
386 def unbufferedread(self, size):
387 if not self._eof and self._lenbuf == 0:
387 if not self._eof and self._lenbuf == 0:
388 self._fillbuffer(max(size, _chunksize))
388 self._fillbuffer(max(size, _chunksize))
389 return self._frombuffer(min(self._lenbuf, size))
389 return self._frombuffer(min(self._lenbuf, size))
390
390
391 def readline(self, *args, **kwargs):
391 def readline(self, *args, **kwargs):
392 if len(self._buffer) > 1:
392 if len(self._buffer) > 1:
393 # this should not happen because both read and readline end with a
393 # this should not happen because both read and readline end with a
394 # _frombuffer call that collapse it.
394 # _frombuffer call that collapse it.
395 self._buffer = [b''.join(self._buffer)]
395 self._buffer = [b''.join(self._buffer)]
396 self._lenbuf = len(self._buffer[0])
396 self._lenbuf = len(self._buffer[0])
397 lfi = -1
397 lfi = -1
398 if self._buffer:
398 if self._buffer:
399 lfi = self._buffer[-1].find(b'\n')
399 lfi = self._buffer[-1].find(b'\n')
400 while (not self._eof) and lfi < 0:
400 while (not self._eof) and lfi < 0:
401 self._fillbuffer()
401 self._fillbuffer()
402 if self._buffer:
402 if self._buffer:
403 lfi = self._buffer[-1].find(b'\n')
403 lfi = self._buffer[-1].find(b'\n')
404 size = lfi + 1
404 size = lfi + 1
405 if lfi < 0: # end of file
405 if lfi < 0: # end of file
406 size = self._lenbuf
406 size = self._lenbuf
407 elif len(self._buffer) > 1:
407 elif len(self._buffer) > 1:
408 # we need to take previous chunks into account
408 # we need to take previous chunks into account
409 size += self._lenbuf - len(self._buffer[-1])
409 size += self._lenbuf - len(self._buffer[-1])
410 return self._frombuffer(size)
410 return self._frombuffer(size)
411
411
412 def _frombuffer(self, size):
412 def _frombuffer(self, size):
413 """return at most 'size' data from the buffer
413 """return at most 'size' data from the buffer
414
414
415 The data are removed from the buffer."""
415 The data are removed from the buffer."""
416 if size == 0 or not self._buffer:
416 if size == 0 or not self._buffer:
417 return b''
417 return b''
418 buf = self._buffer[0]
418 buf = self._buffer[0]
419 if len(self._buffer) > 1:
419 if len(self._buffer) > 1:
420 buf = b''.join(self._buffer)
420 buf = b''.join(self._buffer)
421
421
422 data = buf[:size]
422 data = buf[:size]
423 buf = buf[len(data) :]
423 buf = buf[len(data) :]
424 if buf:
424 if buf:
425 self._buffer = [buf]
425 self._buffer = [buf]
426 self._lenbuf = len(buf)
426 self._lenbuf = len(buf)
427 else:
427 else:
428 self._buffer = []
428 self._buffer = []
429 self._lenbuf = 0
429 self._lenbuf = 0
430 return data
430 return data
431
431
432 def _fillbuffer(self, size=_chunksize):
432 def _fillbuffer(self, size=_chunksize):
433 """read data to the buffer"""
433 """read data to the buffer"""
434 data = os.read(self._input.fileno(), size)
434 data = os.read(self._input.fileno(), size)
435 if not data:
435 if not data:
436 self._eof = True
436 self._eof = True
437 else:
437 else:
438 self._lenbuf += len(data)
438 self._lenbuf += len(data)
439 self._buffer.append(data)
439 self._buffer.append(data)
440
440
441 return data
441 return data
442
442
443
443
444 def mmapread(fp, size=None):
444 def mmapread(fp, size=None):
445 if size == 0:
445 if size == 0:
446 # size of 0 to mmap.mmap() means "all data"
446 # size of 0 to mmap.mmap() means "all data"
447 # rather than "zero bytes", so special case that.
447 # rather than "zero bytes", so special case that.
448 return b''
448 return b''
449 elif size is None:
449 elif size is None:
450 size = 0
450 size = 0
451 try:
451 try:
452 fd = getattr(fp, 'fileno', lambda: fp)()
452 fd = getattr(fp, 'fileno', lambda: fp)()
453 return mmap.mmap(fd, size, access=mmap.ACCESS_READ)
453 return mmap.mmap(fd, size, access=mmap.ACCESS_READ)
454 except ValueError:
454 except ValueError:
455 # Empty files cannot be mmapped, but mmapread should still work. Check
455 # Empty files cannot be mmapped, but mmapread should still work. Check
456 # if the file is empty, and if so, return an empty buffer.
456 # if the file is empty, and if so, return an empty buffer.
457 if os.fstat(fd).st_size == 0:
457 if os.fstat(fd).st_size == 0:
458 return b''
458 return b''
459 raise
459 raise
460
460
461
461
462 class fileobjectproxy(object):
462 class fileobjectproxy(object):
463 """A proxy around file objects that tells a watcher when events occur.
463 """A proxy around file objects that tells a watcher when events occur.
464
464
465 This type is intended to only be used for testing purposes. Think hard
465 This type is intended to only be used for testing purposes. Think hard
466 before using it in important code.
466 before using it in important code.
467 """
467 """
468
468
469 __slots__ = (
469 __slots__ = (
470 '_orig',
470 '_orig',
471 '_observer',
471 '_observer',
472 )
472 )
473
473
474 def __init__(self, fh, observer):
474 def __init__(self, fh, observer):
475 object.__setattr__(self, '_orig', fh)
475 object.__setattr__(self, '_orig', fh)
476 object.__setattr__(self, '_observer', observer)
476 object.__setattr__(self, '_observer', observer)
477
477
478 def __getattribute__(self, name):
478 def __getattribute__(self, name):
479 ours = {
479 ours = {
480 '_observer',
480 '_observer',
481 # IOBase
481 # IOBase
482 'close',
482 'close',
483 # closed if a property
483 # closed if a property
484 'fileno',
484 'fileno',
485 'flush',
485 'flush',
486 'isatty',
486 'isatty',
487 'readable',
487 'readable',
488 'readline',
488 'readline',
489 'readlines',
489 'readlines',
490 'seek',
490 'seek',
491 'seekable',
491 'seekable',
492 'tell',
492 'tell',
493 'truncate',
493 'truncate',
494 'writable',
494 'writable',
495 'writelines',
495 'writelines',
496 # RawIOBase
496 # RawIOBase
497 'read',
497 'read',
498 'readall',
498 'readall',
499 'readinto',
499 'readinto',
500 'write',
500 'write',
501 # BufferedIOBase
501 # BufferedIOBase
502 # raw is a property
502 # raw is a property
503 'detach',
503 'detach',
504 # read defined above
504 # read defined above
505 'read1',
505 'read1',
506 # readinto defined above
506 # readinto defined above
507 # write defined above
507 # write defined above
508 }
508 }
509
509
510 # We only observe some methods.
510 # We only observe some methods.
511 if name in ours:
511 if name in ours:
512 return object.__getattribute__(self, name)
512 return object.__getattribute__(self, name)
513
513
514 return getattr(object.__getattribute__(self, '_orig'), name)
514 return getattr(object.__getattribute__(self, '_orig'), name)
515
515
516 def __nonzero__(self):
516 def __nonzero__(self):
517 return bool(object.__getattribute__(self, '_orig'))
517 return bool(object.__getattribute__(self, '_orig'))
518
518
519 __bool__ = __nonzero__
519 __bool__ = __nonzero__
520
520
521 def __delattr__(self, name):
521 def __delattr__(self, name):
522 return delattr(object.__getattribute__(self, '_orig'), name)
522 return delattr(object.__getattribute__(self, '_orig'), name)
523
523
524 def __setattr__(self, name, value):
524 def __setattr__(self, name, value):
525 return setattr(object.__getattribute__(self, '_orig'), name, value)
525 return setattr(object.__getattribute__(self, '_orig'), name, value)
526
526
527 def __iter__(self):
527 def __iter__(self):
528 return object.__getattribute__(self, '_orig').__iter__()
528 return object.__getattribute__(self, '_orig').__iter__()
529
529
530 def _observedcall(self, name, *args, **kwargs):
530 def _observedcall(self, name, *args, **kwargs):
531 # Call the original object.
531 # Call the original object.
532 orig = object.__getattribute__(self, '_orig')
532 orig = object.__getattribute__(self, '_orig')
533 res = getattr(orig, name)(*args, **kwargs)
533 res = getattr(orig, name)(*args, **kwargs)
534
534
535 # Call a method on the observer of the same name with arguments
535 # Call a method on the observer of the same name with arguments
536 # so it can react, log, etc.
536 # so it can react, log, etc.
537 observer = object.__getattribute__(self, '_observer')
537 observer = object.__getattribute__(self, '_observer')
538 fn = getattr(observer, name, None)
538 fn = getattr(observer, name, None)
539 if fn:
539 if fn:
540 fn(res, *args, **kwargs)
540 fn(res, *args, **kwargs)
541
541
542 return res
542 return res
543
543
544 def close(self, *args, **kwargs):
544 def close(self, *args, **kwargs):
545 return object.__getattribute__(self, '_observedcall')(
545 return object.__getattribute__(self, '_observedcall')(
546 'close', *args, **kwargs
546 'close', *args, **kwargs
547 )
547 )
548
548
549 def fileno(self, *args, **kwargs):
549 def fileno(self, *args, **kwargs):
550 return object.__getattribute__(self, '_observedcall')(
550 return object.__getattribute__(self, '_observedcall')(
551 'fileno', *args, **kwargs
551 'fileno', *args, **kwargs
552 )
552 )
553
553
554 def flush(self, *args, **kwargs):
554 def flush(self, *args, **kwargs):
555 return object.__getattribute__(self, '_observedcall')(
555 return object.__getattribute__(self, '_observedcall')(
556 'flush', *args, **kwargs
556 'flush', *args, **kwargs
557 )
557 )
558
558
559 def isatty(self, *args, **kwargs):
559 def isatty(self, *args, **kwargs):
560 return object.__getattribute__(self, '_observedcall')(
560 return object.__getattribute__(self, '_observedcall')(
561 'isatty', *args, **kwargs
561 'isatty', *args, **kwargs
562 )
562 )
563
563
564 def readable(self, *args, **kwargs):
564 def readable(self, *args, **kwargs):
565 return object.__getattribute__(self, '_observedcall')(
565 return object.__getattribute__(self, '_observedcall')(
566 'readable', *args, **kwargs
566 'readable', *args, **kwargs
567 )
567 )
568
568
569 def readline(self, *args, **kwargs):
569 def readline(self, *args, **kwargs):
570 return object.__getattribute__(self, '_observedcall')(
570 return object.__getattribute__(self, '_observedcall')(
571 'readline', *args, **kwargs
571 'readline', *args, **kwargs
572 )
572 )
573
573
574 def readlines(self, *args, **kwargs):
574 def readlines(self, *args, **kwargs):
575 return object.__getattribute__(self, '_observedcall')(
575 return object.__getattribute__(self, '_observedcall')(
576 'readlines', *args, **kwargs
576 'readlines', *args, **kwargs
577 )
577 )
578
578
579 def seek(self, *args, **kwargs):
579 def seek(self, *args, **kwargs):
580 return object.__getattribute__(self, '_observedcall')(
580 return object.__getattribute__(self, '_observedcall')(
581 'seek', *args, **kwargs
581 'seek', *args, **kwargs
582 )
582 )
583
583
584 def seekable(self, *args, **kwargs):
584 def seekable(self, *args, **kwargs):
585 return object.__getattribute__(self, '_observedcall')(
585 return object.__getattribute__(self, '_observedcall')(
586 'seekable', *args, **kwargs
586 'seekable', *args, **kwargs
587 )
587 )
588
588
589 def tell(self, *args, **kwargs):
589 def tell(self, *args, **kwargs):
590 return object.__getattribute__(self, '_observedcall')(
590 return object.__getattribute__(self, '_observedcall')(
591 'tell', *args, **kwargs
591 'tell', *args, **kwargs
592 )
592 )
593
593
594 def truncate(self, *args, **kwargs):
594 def truncate(self, *args, **kwargs):
595 return object.__getattribute__(self, '_observedcall')(
595 return object.__getattribute__(self, '_observedcall')(
596 'truncate', *args, **kwargs
596 'truncate', *args, **kwargs
597 )
597 )
598
598
599 def writable(self, *args, **kwargs):
599 def writable(self, *args, **kwargs):
600 return object.__getattribute__(self, '_observedcall')(
600 return object.__getattribute__(self, '_observedcall')(
601 'writable', *args, **kwargs
601 'writable', *args, **kwargs
602 )
602 )
603
603
604 def writelines(self, *args, **kwargs):
604 def writelines(self, *args, **kwargs):
605 return object.__getattribute__(self, '_observedcall')(
605 return object.__getattribute__(self, '_observedcall')(
606 'writelines', *args, **kwargs
606 'writelines', *args, **kwargs
607 )
607 )
608
608
609 def read(self, *args, **kwargs):
609 def read(self, *args, **kwargs):
610 return object.__getattribute__(self, '_observedcall')(
610 return object.__getattribute__(self, '_observedcall')(
611 'read', *args, **kwargs
611 'read', *args, **kwargs
612 )
612 )
613
613
614 def readall(self, *args, **kwargs):
614 def readall(self, *args, **kwargs):
615 return object.__getattribute__(self, '_observedcall')(
615 return object.__getattribute__(self, '_observedcall')(
616 'readall', *args, **kwargs
616 'readall', *args, **kwargs
617 )
617 )
618
618
619 def readinto(self, *args, **kwargs):
619 def readinto(self, *args, **kwargs):
620 return object.__getattribute__(self, '_observedcall')(
620 return object.__getattribute__(self, '_observedcall')(
621 'readinto', *args, **kwargs
621 'readinto', *args, **kwargs
622 )
622 )
623
623
624 def write(self, *args, **kwargs):
624 def write(self, *args, **kwargs):
625 return object.__getattribute__(self, '_observedcall')(
625 return object.__getattribute__(self, '_observedcall')(
626 'write', *args, **kwargs
626 'write', *args, **kwargs
627 )
627 )
628
628
629 def detach(self, *args, **kwargs):
629 def detach(self, *args, **kwargs):
630 return object.__getattribute__(self, '_observedcall')(
630 return object.__getattribute__(self, '_observedcall')(
631 'detach', *args, **kwargs
631 'detach', *args, **kwargs
632 )
632 )
633
633
634 def read1(self, *args, **kwargs):
634 def read1(self, *args, **kwargs):
635 return object.__getattribute__(self, '_observedcall')(
635 return object.__getattribute__(self, '_observedcall')(
636 'read1', *args, **kwargs
636 'read1', *args, **kwargs
637 )
637 )
638
638
639
639
class observedbufferedinputpipe(bufferedinputpipe):
    """A variation of bufferedinputpipe that is aware of fileobjectproxy.

    ``bufferedinputpipe`` makes low-level calls to ``os.read()`` that
    bypass ``fileobjectproxy``. Because of this, we need to make
    ``bufferedinputpipe`` aware of these operations.

    This variation of ``bufferedinputpipe`` can notify observers about
    ``os.read()`` events. It also re-publishes other events, such as
    ``read()`` and ``readline()``.
    """

    def _fillbuffer(self):
        res = super(observedbufferedinputpipe, self)._fillbuffer()
        # Tell the observer about the underlying os.read(), if it cares.
        notify = getattr(self._input._observer, 'osread', None)
        if notify:
            notify(res, _chunksize)
        return res

    # We use different observer methods because the operation isn't
    # performed on the actual file object but on us.
    def read(self, size):
        res = super(observedbufferedinputpipe, self).read(size)
        notify = getattr(self._input._observer, 'bufferedread', None)
        if notify:
            notify(res, size)
        return res

    def readline(self, *args, **kwargs):
        res = super(observedbufferedinputpipe, self).readline(*args, **kwargs)
        notify = getattr(self._input._observer, 'bufferedreadline', None)
        if notify:
            notify(res)
        return res
680
680
681
681
# Socket methods that ``socketproxy`` routes through ``_observedcall`` so
# the attached observer can log them; every other attribute lookup falls
# straight through to the wrapped socket.
PROXIED_SOCKET_METHODS = {
    'gettimeout',
    'makefile',
    'recv',
    'recv_into',
    'recvfrom',
    'recvfrom_into',
    'send',
    'sendall',
    'sendto',
    'setblocking',
    'setsockopt',
    'settimeout',
}
696
696
697
697
class socketproxy(object):
    """A proxy around a socket that tells a watcher when events occur.

    This is like ``fileobjectproxy`` except for sockets.

    This type is intended to only be used for testing purposes. Think hard
    before using it in important code.
    """

    __slots__ = (
        '_orig',
        '_observer',
    )

    def __init__(self, sock, observer):
        # Store internal state via object.__setattr__ so our own
        # __setattr__ override (which forwards to the socket) is bypassed.
        object.__setattr__(self, '_orig', sock)
        object.__setattr__(self, '_observer', observer)

    def __getattribute__(self, name):
        # Only the proxied methods are intercepted; everything else is
        # looked up on the wrapped socket.
        if name in PROXIED_SOCKET_METHODS:
            return object.__getattribute__(self, name)

        return getattr(object.__getattribute__(self, '_orig'), name)

    def __delattr__(self, name):
        return delattr(object.__getattribute__(self, '_orig'), name)

    def __setattr__(self, name, value):
        return setattr(object.__getattribute__(self, '_orig'), name, value)

    def __nonzero__(self):
        return bool(object.__getattribute__(self, '_orig'))

    __bool__ = __nonzero__

    def _observedcall(self, name, *args, **kwargs):
        """Invoke ``name`` on the wrapped socket, then notify the observer.

        The observer hook of the same name (if any) receives the result
        followed by the original arguments so it can react, log, etc.
        """
        # Call the original object.
        orig = object.__getattribute__(self, '_orig')
        res = getattr(orig, name)(*args, **kwargs)

        # Call a method on the observer of the same name with arguments
        # so it can react, log, etc.
        observer = object.__getattribute__(self, '_observer')
        fn = getattr(observer, name, None)
        if fn:
            fn(res, *args, **kwargs)

        return res

    def makefile(self, *args, **kwargs):
        res = object.__getattribute__(self, '_observedcall')(
            'makefile', *args, **kwargs
        )

        # The file object may be used for I/O. So we turn it into a
        # proxy using our observer.
        observer = object.__getattribute__(self, '_observer')
        return makeloggingfileobject(
            observer.fh,
            res,
            observer.name,
            reads=observer.reads,
            writes=observer.writes,
            logdata=observer.logdata,
            logdataapis=observer.logdataapis,
        )

    def recv(self, *args, **kwargs):
        return object.__getattribute__(self, '_observedcall')(
            'recv', *args, **kwargs
        )

    def recvfrom(self, *args, **kwargs):
        return object.__getattribute__(self, '_observedcall')(
            'recvfrom', *args, **kwargs
        )

    def recvfrom_into(self, *args, **kwargs):
        return object.__getattribute__(self, '_observedcall')(
            'recvfrom_into', *args, **kwargs
        )

    def recv_into(self, *args, **kwargs):
        # Fix: this previously dispatched to the misspelled name
        # 'recv_info', which raised AttributeError on any real socket and
        # never triggered the observer's recv_into() hook.
        return object.__getattribute__(self, '_observedcall')(
            'recv_into', *args, **kwargs
        )

    def send(self, *args, **kwargs):
        return object.__getattribute__(self, '_observedcall')(
            'send', *args, **kwargs
        )

    def sendall(self, *args, **kwargs):
        return object.__getattribute__(self, '_observedcall')(
            'sendall', *args, **kwargs
        )

    def sendto(self, *args, **kwargs):
        return object.__getattribute__(self, '_observedcall')(
            'sendto', *args, **kwargs
        )

    def setblocking(self, *args, **kwargs):
        return object.__getattribute__(self, '_observedcall')(
            'setblocking', *args, **kwargs
        )

    def settimeout(self, *args, **kwargs):
        return object.__getattribute__(self, '_observedcall')(
            'settimeout', *args, **kwargs
        )

    def gettimeout(self, *args, **kwargs):
        return object.__getattribute__(self, '_observedcall')(
            'gettimeout', *args, **kwargs
        )

    def setsockopt(self, *args, **kwargs):
        return object.__getattribute__(self, '_observedcall')(
            'setsockopt', *args, **kwargs
        )
819
819
820
820
class baseproxyobserver(object):
    """Shared state and payload-logging helper for proxy observers."""

    def __init__(self, fh, name, logdata, logdataapis):
        self.fh = fh  # log destination file object
        self.name = name  # prefix written before each log line
        self.logdata = logdata  # whether payload bytes are logged
        self.logdataapis = logdataapis  # whether API call lines are logged

    def _writedata(self, data):
        # Payload logging disabled: just terminate any pending API line.
        if not self.logdata:
            if self.logdataapis:
                self.fh.write(b'\n')
                self.fh.flush()
            return

        # Simple case writes all data on a single line.
        if b'\n' not in data:
            if self.logdataapis:
                self.fh.write(b': %s\n' % stringutil.escapestr(data))
            else:
                self.fh.write(
                    b'%s> %s\n' % (self.name, stringutil.escapestr(data))
                )
            self.fh.flush()
            return

        # Data with newlines is written to multiple lines.
        if self.logdataapis:
            self.fh.write(b':\n')

        for chunk in data.splitlines(True):
            self.fh.write(
                b'%s> %s\n' % (self.name, stringutil.escapestr(chunk))
            )
        self.fh.flush()
856
856
857
857
class fileobjectobserver(baseproxyobserver):
    """Logs file object activity."""

    def __init__(
        self, fh, name, reads=True, writes=True, logdata=False, logdataapis=True
    ):
        super(fileobjectobserver, self).__init__(fh, name, logdata, logdataapis)
        self.reads = reads
        self.writes = writes

    def read(self, res, size=-1):
        if not self.reads:
            return
        # Python 3 can return None from reads at EOF instead of empty strings.
        if res is None:
            res = b''
        if size == -1 and res == b'':
            # Suppress pointless read(-1) calls that return nothing. These
            # happen _a lot_ on Python 3, and there doesn't seem to be a
            # better workaround to have matching Python 2 and 3 behavior. :(
            return
        if self.logdataapis:
            self.fh.write(b'%s> read(%d) -> %d' % (self.name, size, len(res)))
        self._writedata(res)

    def readline(self, res, limit=-1):
        if not self.reads:
            return
        if self.logdataapis:
            self.fh.write(b'%s> readline() -> %d' % (self.name, len(res)))
        self._writedata(res)

    def readinto(self, res, dest):
        if not self.reads:
            return
        if self.logdataapis:
            self.fh.write(
                b'%s> readinto(%d) -> %r' % (self.name, len(dest), res)
            )
        payload = dest[0:res] if res is not None else b''
        # _writedata() uses the "in" operator and is confused by memoryview
        # because characters are ints on Python 3.
        if isinstance(payload, memoryview):
            payload = payload.tobytes()
        self._writedata(payload)

    def write(self, res, data):
        if not self.writes:
            return
        # Python 2 returns None from some write() calls. Python 3 (reasonably)
        # returns the integer bytes written.
        if res is None and data:
            res = len(data)
        if self.logdataapis:
            self.fh.write(b'%s> write(%d) -> %r' % (self.name, len(data), res))
        self._writedata(data)

    def flush(self, res):
        if not self.writes:
            return
        self.fh.write(b'%s> flush() -> %r\n' % (self.name, res))

    # For observedbufferedinputpipe.
    def bufferedread(self, res, size):
        if not self.reads:
            return
        if self.logdataapis:
            self.fh.write(
                b'%s> bufferedread(%d) -> %d' % (self.name, size, len(res))
            )
        self._writedata(res)

    def bufferedreadline(self, res):
        if not self.reads:
            return
        if self.logdataapis:
            self.fh.write(
                b'%s> bufferedreadline() -> %d' % (self.name, len(res))
            )
        self._writedata(res)
956
956
957
957
def makeloggingfileobject(
    logh, fh, name, reads=True, writes=True, logdata=False, logdataapis=True
):
    """Turn a file object into a logging file object."""
    watcher = fileobjectobserver(
        logh,
        name,
        reads=reads,
        writes=writes,
        logdata=logdata,
        logdataapis=logdataapis,
    )
    return fileobjectproxy(fh, watcher)
972
972
973
973
class socketobserver(baseproxyobserver):
    """Logs socket activity."""

    def __init__(
        self,
        fh,
        name,
        reads=True,
        writes=True,
        states=True,
        logdata=False,
        logdataapis=True,
    ):
        super(socketobserver, self).__init__(fh, name, logdata, logdataapis)
        self.reads = reads
        self.writes = writes
        self.states = states

    def makefile(self, res, mode=None, bufsize=None):
        if not self.states:
            return

        self.fh.write(b'%s> makefile(%r, %r)\n' % (self.name, mode, bufsize))

    def recv(self, res, size, flags=0):
        if not self.reads:
            return

        if self.logdataapis:
            self.fh.write(
                b'%s> recv(%d, %d) -> %d' % (self.name, size, flags, len(res))
            )
        self._writedata(res)

    def recvfrom(self, res, size, flags=0):
        if not self.reads:
            return

        if self.logdataapis:
            self.fh.write(
                b'%s> recvfrom(%d, %d) -> %d'
                % (self.name, size, flags, len(res[0]))
            )

        self._writedata(res[0])

    def recvfrom_into(self, res, buf, size, flags=0):
        if not self.reads:
            return

        if self.logdataapis:
            self.fh.write(
                b'%s> recvfrom_into(%d, %d) -> %d'
                % (self.name, size, flags, res[0])
            )

        self._writedata(buf[0 : res[0]])

    def recv_into(self, res, buf, size=0, flags=0):
        if not self.reads:
            return

        if self.logdataapis:
            self.fh.write(
                b'%s> recv_into(%d, %d) -> %d' % (self.name, size, flags, res)
            )

        self._writedata(buf[0:res])

    def send(self, res, data, flags=0):
        if not self.writes:
            return

        if self.logdataapis:
            # Consistency fix: honor logdataapis like every other method of
            # this class (the API line used to be written unconditionally).
            # Also log the return value directly: socket.send() returns the
            # number of bytes sent (an int), so the previous len(res) raised
            # TypeError whenever this path was exercised.
            self.fh.write(
                b'%s> send(%d, %d) -> %d' % (self.name, len(data), flags, res)
            )
        self._writedata(data)

    def sendall(self, res, data, flags=0):
        if not self.writes:
            return

        if self.logdataapis:
            # Returns None on success. So don't bother reporting return value.
            self.fh.write(
                b'%s> sendall(%d, %d)' % (self.name, len(data), flags)
            )

        self._writedata(data)

    def sendto(self, res, data, flagsoraddress, address=None):
        if not self.writes:
            return

        # sendto() has two signatures; the flags argument is only present
        # when an explicit address is given.
        if address:
            flags = flagsoraddress
        else:
            flags = 0

        if self.logdataapis:
            self.fh.write(
                b'%s> sendto(%d, %d, %r) -> %d'
                % (self.name, len(data), flags, address, res)
            )

        self._writedata(data)

    def setblocking(self, res, flag):
        if not self.states:
            return

        self.fh.write(b'%s> setblocking(%r)\n' % (self.name, flag))

    def settimeout(self, res, value):
        if not self.states:
            return

        self.fh.write(b'%s> settimeout(%r)\n' % (self.name, value))

    def gettimeout(self, res):
        if not self.states:
            return

        self.fh.write(b'%s> gettimeout() -> %f\n' % (self.name, res))

    def setsockopt(self, res, level, optname, value):
        if not self.states:
            return

        self.fh.write(
            b'%s> setsockopt(%r, %r, %r) -> %r\n'
            % (self.name, level, optname, value, res)
        )
1107
1107
1108
1108
def makeloggingsocket(
    logh,
    fh,
    name,
    reads=True,
    writes=True,
    states=True,
    logdata=False,
    logdataapis=True,
):
    """Turn a socket into a logging socket."""
    watcher = socketobserver(
        logh,
        name,
        reads=reads,
        writes=writes,
        states=states,
        logdata=logdata,
        logdataapis=logdataapis,
    )
    return socketproxy(fh, watcher)
1131
1131
1132
1132
def version():
    """Return version information if available."""
    try:
        from . import __version__
    except ImportError:
        return b'unknown'
    return __version__.version
1141
1141
1142
1142
def versiontuple(v=None, n=4):
    """Parses a Mercurial version string into an N-tuple.

    The version string to be parsed is specified with the ``v`` argument.
    If it isn't defined, the current Mercurial version string will be parsed.

    ``n`` can be 2, 3, or 4. Here is how some version strings map to
    returned values:

    >>> v = b'3.6.1+190-df9b73d2d444'
    >>> versiontuple(v, 2)
    (3, 6)
    >>> versiontuple(v, 3)
    (3, 6, 1)
    >>> versiontuple(v, 4)
    (3, 6, 1, '190-df9b73d2d444')

    >>> versiontuple(b'3.6.1+190-df9b73d2d444+20151118')
    (3, 6, 1, '190-df9b73d2d444+20151118')

    >>> v = b'3.6'
    >>> versiontuple(v, 2)
    (3, 6)
    >>> versiontuple(v, 3)
    (3, 6, None)
    >>> versiontuple(v, 4)
    (3, 6, None, None)

    >>> v = b'3.9-rc'
    >>> versiontuple(v, 2)
    (3, 9)
    >>> versiontuple(v, 3)
    (3, 9, None)
    >>> versiontuple(v, 4)
    (3, 9, None, 'rc')

    >>> v = b'3.9-rc+2-02a8fea4289b'
    >>> versiontuple(v, 2)
    (3, 9)
    >>> versiontuple(v, 3)
    (3, 9, None)
    >>> versiontuple(v, 4)
    (3, 9, None, 'rc+2-02a8fea4289b')

    >>> versiontuple(b'4.6rc0')
    (4, 6, None, 'rc0')
    >>> versiontuple(b'4.6rc0+12-425d55e54f98')
    (4, 6, None, 'rc0+12-425d55e54f98')
    >>> versiontuple(b'.1.2.3')
    (None, None, None, '.1.2.3')
    >>> versiontuple(b'12.34..5')
    (12, 34, None, '..5')
    >>> versiontuple(b'1.2.3.4.5.6')
    (1, 2, 3, '.4.5.6')
    """
    if not v:
        v = version()
    # Leading dotted numeric part, optional '+' or '-' separator, then
    # everything else as the "extra" component.
    m = remod.match(br'(\d+(?:\.\d+){,2})[+-]?(.*)', v)
    if not m:
        vparts, extra = b'', v
    elif m.group(2):
        vparts, extra = m.groups()
    else:
        vparts, extra = m.group(1), None

    assert vparts is not None  # help pytype

    vints = []
    for i in vparts.split(b'.'):
        try:
            vints.append(int(i))
        except ValueError:
            break
    # (3, 6) -> (3, 6, None)
    while len(vints) < 3:
        vints.append(None)

    if n == 2:
        return (vints[0], vints[1])
    if n == 3:
        return (vints[0], vints[1], vints[2])
    if n == 4:
        return (vints[0], vints[1], vints[2], extra)
    # Previously an unsupported ``n`` silently fell through and returned
    # None; raise instead so programming errors are caught early.
    raise ValueError(b'versiontuple n must be 2, 3, or 4: %d' % n)
1226
1226
1227
1227
def cachefunc(func):
    '''cache the result of function calls'''
    # XXX doesn't handle keywords args
    argcount = func.__code__.co_argcount
    if argcount == 0:
        # A zero-argument callable memoizes a single result; a one-slot
        # list doubles as the "already computed?" flag.
        memo = []

        def f():
            if not memo:
                memo.append(func())
            return memo[0]

        return f

    cache = {}
    if argcount == 1:
        # Single-argument fast path: key on the bare argument so we
        # don't pay for packing/unpacking an args tuple.
        def f(arg):
            try:
                return cache[arg]
            except KeyError:
                cache[arg] = func(arg)
                return cache[arg]

    else:

        def f(*args):
            try:
                return cache[args]
            except KeyError:
                cache[args] = func(*args)
                return cache[args]

    return f
1257
1257
1258
1258
class cow(object):
    """helper class to make copy-on-write easier

    Call preparewrite before doing any writes.
    """

    def preparewrite(self):
        """call this before writes, return self or a copied new object"""
        pending = getattr(self, '_copied', 0)
        if not pending:
            # Nobody shares this object; writing in place is safe.
            return self
        self._copied = pending - 1
        # Function cow.__init__ expects 1 arg(s), got 2 [wrong-arg-count]
        return self.__class__(self)  # pytype: disable=wrong-arg-count

    def copy(self):
        """always do a cheap copy"""
        self._copied = getattr(self, '_copied', 0) + 1
        return self
1277
1277
1278
1278
class sortdict(collections.OrderedDict):
    """a simple sorted dictionary

    >>> d1 = sortdict([(b'a', 0), (b'b', 1)])
    >>> d2 = d1.copy()
    >>> d2
    sortdict([('a', 0), ('b', 1)])
    >>> d2.update([(b'a', 2)])
    >>> list(d2.keys()) # should still be in last-set order
    ['b', 'a']
    >>> d1.insert(1, b'a.5', 0.5)
    >>> d1
    sortdict([('a', 0), ('a.5', 0.5), ('b', 1)])
    """

    def __setitem__(self, key, value):
        # Re-setting an existing key moves it to the end ("last-set"
        # order), unlike plain OrderedDict which keeps the original slot.
        if key in self:
            del self[key]
        super(sortdict, self).__setitem__(key, value)

    if pycompat.ispypy:
        # __setitem__() isn't called as of PyPy 5.8.0
        def update(self, src, **f):
            if isinstance(src, dict):
                src = pycompat.iteritems(src)
            for k, v in src:
                self[k] = v
            for k in f:
                self[k] = f[k]

    def insert(self, position, key, value):
        # Insert (key, value) at index ``position`` by rewriting the
        # tail: every existing entry at or after ``position`` is deleted
        # and re-appended after the new entry, preserving relative order.
        for (i, (k, v)) in enumerate(list(self.items())):
            if i == position:
                self[key] = value
            if i >= position:
                del self[k]
                self[k] = v
1316
1316
1317
1317
class cowdict(cow, dict):
    """copy-on-write dict

    Be sure to call d = d.preparewrite() before writing to d.

    >>> a = cowdict()
    >>> a is a.preparewrite()
    True
    >>> b = a.copy()
    >>> b is a
    True
    >>> c = b.copy()
    >>> c is a
    True
    >>> a = a.preparewrite()
    >>> b is a
    False
    >>> a is a.preparewrite()
    True
    >>> c = c.preparewrite()
    >>> b is c
    False
    >>> b is b.preparewrite()
    True
    """

    # No body needed: copy()/preparewrite() come from the cow mixin and
    # all mapping behavior comes from the plain dict base class.
1343
1343
1344
1344
class cowsortdict(cow, sortdict):
    """copy-on-write sortdict

    Be sure to call d = d.preparewrite() before writing to d.
    """

    # No body needed: copy()/preparewrite() come from the cow mixin and
    # ordered-mapping behavior comes from sortdict.
1350
1350
1351
1351
class transactional(object):  # pytype: disable=ignored-metaclass
    """Base class for making a transactional type into a context manager."""

    __metaclass__ = abc.ABCMeta

    @abc.abstractmethod
    def close(self):
        """Successfully closes the transaction."""

    @abc.abstractmethod
    def release(self):
        """Marks the end of the transaction.

        If the transaction has not been closed, it will be aborted.
        """

    def __enter__(self):
        return self

    def __exit__(self, exc_type, exc_val, exc_tb):
        # Commit only on a clean exit; release() always runs, which (per
        # the release() contract above) aborts the transaction if close()
        # was never reached.
        try:
            if exc_type is None:
                self.close()
        finally:
            self.release()
1377
1377
1378
1378
@contextlib.contextmanager
def acceptintervention(tr=None):
    """A context manager that closes the transaction on InterventionRequired

    If no transaction was provided, this simply runs the body and returns
    """
    if not tr:
        yield
        return
    try:
        yield
        tr.close()
    except error.InterventionRequired:
        # The transaction is closed (not aborted) even though the body
        # raised: InterventionRequired means the user must finish the
        # operation later, so the work done so far must be preserved.
        tr.close()
        raise
    finally:
        # release() after close() is a no-op commit-finalization; if an
        # unexpected exception skipped close(), it aborts the transaction.
        tr.release()
1396
1396
1397
1397
@contextlib.contextmanager
def nullcontextmanager(enter_result=None):
    # No-op context manager: yields ``enter_result`` unchanged and does no
    # cleanup.  NOTE(review): presumably kept instead of
    # contextlib.nullcontext for compatibility with older Pythons — confirm.
    yield enter_result
1401
1401
1402
1402
class _lrucachenode(object):
    """A node in a doubly linked list.

    Holds a reference to nodes on either side as well as a key-value
    pair for the dictionary entry.
    """

    __slots__ = ('next', 'prev', 'key', 'value', 'cost')

    def __init__(self):
        # A fresh node is its own neighbor on both sides, forming a
        # one-element circular list; it starts out empty.
        self.prev = self
        self.next = self
        self.markempty()

    def markempty(self):
        """Mark the node as emptied."""
        self.key = _notset
        self.value = None
        self.cost = 0
1425
1425
1426
1426
class lrucachedict(object):
    """Dict that caches most recent accesses and sets.

    The dict consists of an actual backing dict - indexed by original
    key - and a doubly linked circular list defining the order of entries in
    the cache.

    The head node is the newest entry in the cache. If the cache is full,
    we recycle head.prev and make it the new head. Cache accesses result in
    the node being moved to before the existing head and being marked as the
    new head node.

    Items in the cache can be inserted with an optional "cost" value. This is
    simply an integer that is specified by the caller. The cache can be queried
    for the total cost of all items presently in the cache.

    The cache can also define a maximum cost. If a cache insertion would
    cause the total cost of the cache to go beyond the maximum cost limit,
    nodes will be evicted to make room for the new code. This can be used
    to e.g. set a max memory limit and associate an estimated bytes size
    cost to each item in the cache. By default, no maximum cost is enforced.
    """

    def __init__(self, max, maxcost=0):
        # ``max``: maximum number of entries; ``maxcost``: optional cap on
        # the sum of per-entry costs (0 disables cost enforcement).
        self._cache = {}

        # The circular list starts as a single empty node; capacity is
        # added lazily by _addcapacity() as items are inserted.
        self._head = _lrucachenode()
        self._size = 1
        self.capacity = max
        self.totalcost = 0
        self.maxcost = maxcost

    def __len__(self):
        # Number of live entries (the linked list may hold empty nodes).
        return len(self._cache)

    def __contains__(self, k):
        # Membership test does NOT count as an access (no LRU update).
        return k in self._cache

    def __iter__(self):
        # We don't have to iterate in cache order, but why not.
        n = self._head
        for i in range(len(self._cache)):
            yield n.key
            n = n.next

    def __getitem__(self, k):
        # A lookup counts as an access: the node becomes the newest entry.
        node = self._cache[k]
        self._movetohead(node)
        return node.value

    def insert(self, k, v, cost=0):
        """Insert a new item in the cache with optional cost value."""
        node = self._cache.get(k)
        # Replace existing value and mark as newest.
        if node is not None:
            self.totalcost -= node.cost
            node.value = v
            node.cost = cost
            self.totalcost += cost
            self._movetohead(node)

            if self.maxcost:
                self._enforcecostlimit()

            return

        if self._size < self.capacity:
            node = self._addcapacity()
        else:
            # Grab the last/oldest item.
            node = self._head.prev

            # At capacity. Kill the old entry.
            if node.key is not _notset:
                self.totalcost -= node.cost
                del self._cache[node.key]

        node.key = k
        node.value = v
        node.cost = cost
        self.totalcost += cost
        self._cache[k] = node
        # And mark it as newest entry. No need to adjust order since it
        # is already self._head.prev.
        self._head = node

        if self.maxcost:
            self._enforcecostlimit()

    def __setitem__(self, k, v):
        # Plain assignment inserts with cost 0.
        self.insert(k, v)

    def __delitem__(self, k):
        self.pop(k)

    def pop(self, k, default=_notset):
        # Remove and return the value for ``k``; raises KeyError unless a
        # ``default`` was supplied (the _notset sentinel lets callers pass
        # None as a real default).
        try:
            node = self._cache.pop(k)
        except KeyError:
            if default is _notset:
                raise
            return default

        assert node is not None  # help pytype
        value = node.value
        self.totalcost -= node.cost
        node.markempty()

        # Temporarily mark as newest item before re-adjusting head to make
        # this node the oldest item.
        self._movetohead(node)
        self._head = node.next

        return value

    # Additional dict methods.

    def get(self, k, default=None):
        # Like __getitem__ (updates recency on a hit) but returns
        # ``default`` instead of raising on a miss.
        try:
            return self.__getitem__(k)
        except KeyError:
            return default

    def peek(self, k, default=_notset):
        """Get the specified item without moving it to the head

        Unlike get(), this doesn't mutate the internal state. But be aware
        that it doesn't mean peek() is thread safe.
        """
        try:
            node = self._cache[k]
            assert node is not None  # help pytype
            return node.value
        except KeyError:
            if default is _notset:
                raise
            return default

    def clear(self):
        # Walk from the head (newest) emptying nodes; empty nodes only
        # occur after the live ones, so stopping at the first empty node
        # clears every entry.  The linked-list capacity is kept.
        n = self._head
        while n.key is not _notset:
            self.totalcost -= n.cost
            n.markempty()
            n = n.next

        self._cache.clear()

    def copy(self, capacity=None, maxcost=0):
        """Create a new cache as a copy of the current one.

        By default, the new cache has the same capacity as the existing one.
        But, the cache capacity can be changed as part of performing the
        copy.

        Items in the copy have an insertion/access order matching this
        instance.
        """

        capacity = capacity or self.capacity
        maxcost = maxcost or self.maxcost
        result = lrucachedict(capacity, maxcost=maxcost)

        # We copy entries by iterating in oldest-to-newest order so the copy
        # has the correct ordering.

        # Find the first non-empty entry.
        n = self._head.prev
        while n.key is _notset and n is not self._head:
            n = n.prev

        # We could potentially skip the first N items when decreasing capacity.
        # But let's keep it simple unless it is a performance problem.
        for i in range(len(self._cache)):
            result.insert(n.key, n.value, cost=n.cost)
            n = n.prev

        return result

    def popoldest(self):
        """Remove the oldest item from the cache.

        Returns the (key, value) describing the removed cache entry.
        """
        if not self._cache:
            return

        # Walk the linked list backwards starting at tail node until we hit
        # a non-empty node.
        n = self._head.prev

        assert n is not None  # help pytype

        while n.key is _notset:
            n = n.prev

        assert n is not None  # help pytype

        key, value = n.key, n.value

        # And remove it from the cache and mark it as empty.
        del self._cache[n.key]
        self.totalcost -= n.cost
        n.markempty()

        return key, value

    def _movetohead(self, node):
        """Mark a node as the newest, making it the new head.

        When a node is accessed, it becomes the freshest entry in the LRU
        list, which is denoted by self._head.

        Visually, let's make ``N`` the new head node (* denotes head):

            previous/oldest <-> head <-> next/next newest

            ----<->--- A* ---<->-----
            |                       |
            E <-> D <-> N <-> C <-> B

        To:

            ----<->--- N* ---<->-----
            |                       |
            E <-> D <-> C <-> B <-> A

        This requires the following moves:

           C.next = D  (node.prev.next = node.next)
           D.prev = C  (node.next.prev = node.prev)
           E.next = N  (head.prev.next = node)
           N.prev = E  (node.prev = head.prev)
           N.next = A  (node.next = head)
           A.prev = N  (head.prev = node)
        """
        head = self._head
        # C.next = D
        node.prev.next = node.next
        # D.prev = C
        node.next.prev = node.prev
        # N.prev = E
        node.prev = head.prev
        # N.next = A
        # It is tempting to do just "head" here, however if node is
        # adjacent to head, this will do bad things.
        node.next = head.prev.next
        # E.next = N
        node.next.prev = node
        # A.prev = N
        node.prev.next = node

        self._head = node

    def _addcapacity(self):
        """Add a node to the circular linked list.

        The new node is inserted before the head node.
        """
        head = self._head
        node = _lrucachenode()
        head.prev.next = node
        node.prev = head.prev
        node.next = head
        head.prev = node
        self._size += 1
        return node

    def _enforcecostlimit(self):
        # This should run after an insertion. It should only be called if total
        # cost limits are being enforced.
        # The most recently inserted node is never evicted.
        if len(self) <= 1 or self.totalcost <= self.maxcost:
            return

        # This is logically equivalent to calling popoldest() until we
        # free up enough cost. We don't do that since popoldest() needs
        # to walk the linked list and doing this in a loop would be
        # quadratic. So we find the first non-empty node and then
        # walk nodes until we free up enough capacity.
        #
        # If we only removed the minimum number of nodes to free enough
        # cost at insert time, chances are high that the next insert would
        # also require pruning. This would effectively constitute quadratic
        # behavior for insert-heavy workloads. To mitigate this, we set a
        # target cost that is a percentage of the max cost. This will tend
        # to free more nodes when the high water mark is reached, which
        # lowers the chances of needing to prune on the subsequent insert.
        targetcost = int(self.maxcost * 0.75)

        n = self._head.prev
        while n.key is _notset:
            n = n.prev

        while len(self) > 1 and self.totalcost > targetcost:
            del self._cache[n.key]
            self.totalcost -= n.cost
            n.markempty()
            n = n.prev
1725
1725
1726
1726
def lrucachefunc(func):
    '''cache most recent results of function calls'''
    cache = {}
    order = collections.deque()
    # Eviction kicks in once the cache holds more than this many entries.
    maxsize = 20

    if func.__code__.co_argcount == 1:
        # Single-argument functions are keyed on the bare argument so we
        # skip packing/unpacking an args tuple.
        def f(arg):
            if arg in cache:
                # Cache hit: refresh recency by moving the key to the back.
                order.remove(arg)
            else:
                if len(cache) > maxsize:
                    del cache[order.popleft()]
                cache[arg] = func(arg)
            order.append(arg)
            return cache[arg]

    else:

        def f(*args):
            if args in cache:
                order.remove(args)
            else:
                if len(cache) > maxsize:
                    del cache[order.popleft()]
                cache[args] = func(*args)
            order.append(args)
            return cache[args]

    return f
1756
1756
1757
1757
class propertycache(object):
    """Descriptor computing an attribute once and caching it on the instance.

    Because the value is written into the instance ``__dict__``, later
    attribute lookups bypass this (non-data) descriptor entirely.
    """

    def __init__(self, func):
        self.func = func
        self.name = func.__name__

    def __get__(self, obj, type=None):
        value = self.func(obj)
        self.cachevalue(obj, value)
        return value

    def cachevalue(self, obj, value):
        # __dict__ assignment required to bypass __setattr__ (eg: repoview)
        obj.__dict__[self.name] = value
1771
1771
1772
1772
def clearcachedproperty(obj, prop):
    '''clear a cached property value, if one has been set'''
    # propertycache stores the value under the native-str attribute name;
    # pop with a default makes a missing entry a harmless no-op.
    obj.__dict__.pop(pycompat.sysstr(prop), None)
1778
1778
1779
1779
def increasingchunks(source, min=1024, max=65536):
    """return no less than min bytes per chunk while data remains,
    doubling min after each chunk until it reaches max

    ``source`` is an iterable of byte strings.  Input chunks are buffered
    until at least ``min`` bytes have accumulated, then re-emitted as one
    joined chunk.  The final chunk may be smaller than ``min``.
    """

    def log2(x):
        # floor(log2(x)) for x > 0; 0 for x == 0.  int.bit_length() is the
        # standard-library equivalent of the previous manual
        # shift-and-count loop (and avoids 1 << -1 for x == 0).
        if not x:
            return 0
        return x.bit_length() - 1

    buf = []
    blen = 0
    for chunk in source:
        buf.append(chunk)
        blen += len(chunk)
        if blen >= min:
            if min < max:
                # Grow the threshold: at least double it, jump straight
                # past the size we just accumulated if that is bigger,
                # but never beyond max.
                min = min << 1
                nmin = 1 << log2(blen)
                if nmin > min:
                    min = nmin
                if min > max:
                    min = max
            yield b''.join(buf)
            blen = 0
            buf = []
    if buf:
        yield b''.join(buf)
1811
1811
1812
1812
def always(fn):
    """Constant-true predicate: returns True for any input, ignoring ``fn``."""
    return True
1815
1815
1816
1816
def never(fn):
    """Constant-false predicate: returns False for any input, ignoring ``fn``."""
    return False
1819
1819
1820
1820
def nogc(func):
    """Decorator disabling the garbage collector around each call of *func*.

    Python's garbage collector triggers a GC each time a certain number of
    container objects (the number being defined by gc.get_threshold()) are
    allocated even when marked not to be tracked by the collector. Tracking has
    no effect on when GCs are triggered, only on what objects the GC looks
    into. As a workaround, disable GC while building complex (huge)
    containers.

    This garbage collector issue have been fixed in 2.7. But it still affect
    CPython's performance.
    """

    def _gc_disabled_call(*args, **kwargs):
        # remember whether to turn the collector back on afterwards
        reenable = gc.isenabled()
        gc.disable()
        try:
            return func(*args, **kwargs)
        finally:
            if reenable:
                gc.enable()

    return _gc_disabled_call
1845
1845
1846
1846
# On PyPy, disabling the collector hurts rather than helps, so the
# decorator degrades to the identity function there.
if pycompat.ispypy:
    # PyPy runs slower with gc disabled
    nogc = lambda x: x
1850
1850
1851
1851
def pathto(root, n1, n2):
    # type: (bytes, bytes, bytes) -> bytes
    """return the relative path from one place to another.
    root should use os.sep to separate directories
    n1 should use os.sep to separate directories
    n2 should use "/" to separate directories
    returns an os.sep-separated path.

    If n1 is a relative path, it's assumed it's
    relative to root.
    n2 should always be relative to root.
    """
    if not n1:
        return localpath(n2)
    if os.path.isabs(n1):
        if os.path.splitdrive(root)[0] != os.path.splitdrive(n1)[0]:
            # different drives: no relative path exists, fall back to
            # an absolute destination path
            return os.path.join(root, localpath(n2))
        n2 = b'/'.join((pconvert(root), n2))
    fromparts = splitpath(n1)
    toparts = n2.split(b'/')
    # skip the shared leading components of both paths
    common = 0
    while (
        common < len(fromparts)
        and common < len(toparts)
        and fromparts[common] == toparts[common]
    ):
        common += 1
    # climb out of what remains of n1, then descend into n2
    up = [b'..'] * (len(fromparts) - common)
    return pycompat.ossep.join(up + toparts[common:]) or b'.'
1878
1878
1879
1879
def checksignature(func, depth=1):
    """Wrap *func* so that calling it with a mismatched signature raises
    error.SignatureError instead of a plain TypeError.

    A TypeError whose traceback is exactly *depth* frames deep is assumed
    to come from the call itself (bad arguments) rather than from inside
    the function body, and is translated; deeper TypeErrors re-raise.
    """

    def checked(*args, **kwargs):
        try:
            return func(*args, **kwargs)
        except TypeError:
            frames = traceback.extract_tb(sys.exc_info()[2])
            if len(frames) == depth:
                raise error.SignatureError
            raise

    return checked
1892
1892
1893
1893
# a whitelist of known filesystems where hardlink works reliably
_hardlinkfswhitelist = {
    b'apfs',
    b'btrfs',
    b'ext2',
    b'ext3',
    b'ext4',
    b'hfs',
    b'jfs',
    b'NTFS',
    b'reiserfs',
    b'tmpfs',
    b'ufs',
    b'xfs',
    b'zfs',
}
1910
1910
1911
1911
def copyfile(
    src, dest, hardlink=False, copystat=False, checkambig=False, nb_bytes=None
):
    """copy a file, preserving mode and optionally other stat info like
    atime/mtime

    checkambig argument is used with filestat, and is useful only if
    destination file is guarded by any lock (e.g. repo.lock or
    repo.wlock).

    copystat and checkambig should be exclusive.

    nb_bytes: if set only copy the first `nb_bytes` of the source file.
    """
    assert not (copystat and checkambig)
    oldstat = None
    if os.path.lexists(dest):
        if checkambig:
            oldstat = checkambig and filestat.frompath(dest)
        unlink(dest)
    if hardlink:
        # Hardlinks are problematic on CIFS (issue4546), do not allow hardlinks
        # unless we are confident that dest is on a whitelisted filesystem.
        try:
            fstype = getfstype(os.path.dirname(dest))
        except OSError:
            fstype = None
        if fstype not in _hardlinkfswhitelist:
            hardlink = False
    if hardlink:
        # validate *before* creating the link, so a caller bug does not
        # leave a stray hardlink behind when ProgrammingError is raised
        if nb_bytes is not None:
            m = "the `nb_bytes` argument is incompatible with `hardlink`"
            raise error.ProgrammingError(m)
        try:
            oslink(src, dest)
            return
        except (IOError, OSError):
            pass  # fall back to normal copy
    if os.path.islink(src):
        # validate before creating the symlink (see the hardlink case above)
        if nb_bytes is not None:
            m = "cannot use `nb_bytes` on a symlink"
            raise error.ProgrammingError(m)
        os.symlink(os.readlink(src), dest)
        # copytime is ignored for symlinks, but in general copytime isn't
        # needed for them anyway
    else:
        try:
            shutil.copyfile(src, dest)
            if copystat:
                # copystat also copies mode
                shutil.copystat(src, dest)
            else:
                shutil.copymode(src, dest)
            if oldstat and oldstat.stat:
                newstat = filestat.frompath(dest)
                if newstat.isambig(oldstat):
                    # stat of copied file is ambiguous to original one
                    advanced = (
                        oldstat.stat[stat.ST_MTIME] + 1
                    ) & 0x7FFFFFFF
                    os.utime(dest, (advanced, advanced))
            # We could do something smarter using `copy_file_range` call or
            # similar
            if nb_bytes is not None:
                # binary mode: dest may hold arbitrary bytes, and text mode
                # would be wrong on platforms with newline translation
                with open(dest, mode='r+b') as f:
                    f.truncate(nb_bytes)
        except shutil.Error as inst:
            raise error.Abort(stringutil.forcebytestr(inst))
1965
1979
1966
1980
def copyfiles(src, dst, hardlink=None, progress=None):
    """Copy a directory tree using hardlinks if possible.

    ``hardlink`` may be None (auto-detect: link only when src and dst are
    on the same device), True or False.  Returns a ``(hardlink, count)``
    pair: the effective link mode (degrades to False once a link attempt
    fails) and the number of files copied.
    """
    num = 0

    def settopic():
        if progress:
            progress.topic = _(b'linking') if hardlink else _(b'copying')

    if os.path.isdir(src):
        if hardlink is None:
            # hardlinks only work within a single device
            hardlink = (
                os.stat(src).st_dev == os.stat(os.path.dirname(dst)).st_dev
            )
        settopic()
        os.mkdir(dst)
        for name, kind in listdir(src):
            srcname = os.path.join(src, name)
            dstname = os.path.join(dst, name)
            # recurse; the returned flag is fed back so a failed link
            # disables linking for the remainder of the tree
            hardlink, n = copyfiles(srcname, dstname, hardlink, progress)
            num += n
    else:
        if hardlink is None:
            hardlink = (
                os.stat(os.path.dirname(src)).st_dev
                == os.stat(os.path.dirname(dst)).st_dev
            )
        settopic()

        if hardlink:
            try:
                oslink(src, dst)
            except (IOError, OSError):
                # fall back to plain copies from here on
                hardlink = False
                shutil.copy(src, dst)
        else:
            shutil.copy(src, dst)
        num += 1
        if progress:
            progress.increment()

    return hardlink, num
2008
2022
2009
2023
# Filename components that Windows reserves for devices regardless of
# extension; checkwinfilename() compares the lowercased first
# dot-separated component against this set.
_winreservednames = {
    b'con',
    b'prn',
    b'aux',
    b'nul',
    b'com1',
    b'com2',
    b'com3',
    b'com4',
    b'com5',
    b'com6',
    b'com7',
    b'com8',
    b'com9',
    b'lpt1',
    b'lpt2',
    b'lpt3',
    b'lpt4',
    b'lpt5',
    b'lpt6',
    b'lpt7',
    b'lpt8',
    b'lpt9',
}
# Characters that may never appear in a Windows filename.
_winreservedchars = b':*?"<>|'
2035
2049
2036
2050
def checkwinfilename(path):
    # type: (bytes) -> Optional[bytes]
    r"""Check that the base-relative path is a valid filename on Windows.
    Returns None if the path is ok, or a UI string describing the problem.

    >>> checkwinfilename(b"just/a/normal/path")
    >>> checkwinfilename(b"foo/bar/con.xml")
    "filename contains 'con', which is reserved on Windows"
    >>> checkwinfilename(b"foo/con.xml/bar")
    "filename contains 'con', which is reserved on Windows"
    >>> checkwinfilename(b"foo/bar/xml.con")
    >>> checkwinfilename(b"foo/bar/AUX/bla.txt")
    "filename contains 'AUX', which is reserved on Windows"
    >>> checkwinfilename(b"foo/bar/bla:.txt")
    "filename contains ':', which is reserved on Windows"
    >>> checkwinfilename(b"foo/bar/b\07la.txt")
    "filename contains '\\x07', which is invalid on Windows"
    >>> checkwinfilename(b"foo/bar/bla ")
    "filename ends with ' ', which is not allowed on Windows"
    >>> checkwinfilename(b"../bar")
    >>> checkwinfilename(b"foo\\")
    "filename ends with '\\', which is invalid on Windows"
    >>> checkwinfilename(b"foo\\/bar")
    "directory name ends with '\\', which is invalid on Windows"
    """
    if path.endswith(b'\\'):
        return _(b"filename ends with '\\', which is invalid on Windows")
    if b'\\/' in path:
        return _(b"directory name ends with '\\', which is invalid on Windows")
    # validate each path component separately
    for n in path.replace(b'\\', b'/').split(b'/'):
        if not n:
            continue
        for c in _filenamebytestr(n):
            # reserved punctuation (':*?"<>|')
            if c in _winreservedchars:
                return (
                    _(
                        b"filename contains '%s', which is reserved "
                        b"on Windows"
                    )
                    % c
                )
            # control characters are never allowed
            if ord(c) <= 31:
                return _(
                    b"filename contains '%s', which is invalid on Windows"
                ) % stringutil.escapestr(c)
        # device names like 'con' are reserved whatever the extension
        base = n.split(b'.')[0]
        if base and base.lower() in _winreservednames:
            return (
                _(b"filename contains '%s', which is reserved on Windows")
                % base
            )
        # Windows silently strips a trailing dot or space; the bytes
        # containment test 'n not in b'..'' lets '.' and '..' through
        t = n[-1:]
        if t in b'. ' and n not in b'..':
            return (
                _(
                    b"filename ends with '%s', which is not allowed "
                    b"on Windows"
                )
                % t
            )
2097
2111
2098
2112
# pick the best wall-clock timer this interpreter offers;
# perf_counter exists on Python >= 3.3
timer = getattr(time, "perf_counter", None)

if pycompat.iswindows:
    checkosfilename = checkwinfilename
    if not timer:
        timer = time.clock
else:
    # mercurial.windows doesn't have platform.checkosfilename
    checkosfilename = platform.checkosfilename  # pytype: disable=module-attr
    if not timer:
        timer = time.time
2110
2124
2111
2125
def makelock(info, pathname):
    """Create a lock file atomically if possible

    This may leave a stale lock file if symlink isn't supported and signal
    interrupt is enabled.
    """
    # preferred form: a symlink whose target carries the lock info,
    # created atomically by the OS
    try:
        return os.symlink(info, pathname)
    except OSError as why:
        if why.errno == errno.EEXIST:
            raise
    except AttributeError:  # no symlink in os
        pass

    # fallback: an exclusively-created regular file holding the info
    flags = getattr(os, 'O_BINARY', 0) | os.O_CREAT | os.O_WRONLY | os.O_EXCL
    fd = os.open(pathname, flags)
    os.write(fd, info)
    os.close(fd)
2130
2144
2131
2145
def readlock(pathname):
    # type: (bytes) -> bytes
    """Return the content of a lock file created by makelock().

    The info is stored either as a symlink target (the common, atomic
    form) or as the content of a regular file (the no-symlink fallback).
    """
    try:
        return readlink(pathname)
    except OSError as why:
        # EINVAL: not a symlink; ENOSYS: symlinks unsupported --
        # in both cases fall through and read the file content
        if why.errno not in (errno.EINVAL, errno.ENOSYS):
            raise
    except AttributeError:  # no symlink in os
        pass
    with posixfile(pathname, b'rb') as fp:
        return fp.read()
2143
2157
2144
2158
def fstat(fp):
    """Stat a file object.

    Uses the file descriptor when the object has a ``fileno`` method,
    otherwise falls back to stat-ing the path in ``fp.name``.
    """
    try:
        fd = fp.fileno()
    except AttributeError:
        return os.stat(fp.name)
    return os.fstat(fd)
2151
2165
2152
2166
2153 # File system features
2167 # File system features
2154
2168
2155
2169
def fscasesensitive(path):
    # type: (bytes) -> bool
    """
    Return true if the given path is on a case-sensitive filesystem

    Requires a path (like /foo/.hg) ending with a foldable final
    directory component.
    """
    st = os.lstat(path)
    dirpart, base = os.path.split(path)
    # flip the case of the final component
    folded = base.upper()
    if folded == base:
        folded = base.lower()
    if folded == base:
        # nothing foldable: no evidence against case sensitivity
        return True
    try:
        st2 = os.lstat(os.path.join(dirpart, folded))
    except OSError:
        # the case-flipped name does not resolve: case-sensitive
        return True
    # same inode for both spellings means case-insensitive
    return st2 != st
2179
2193
2180
2194
# identity by default; swapped for pycompat.sysstr in _re._checkre2 when
# the installed re2 binding only accepts native strings
_re2_input = lambda x: x
try:
    import re2  # pytype: disable=import-error

    # None means "usability not probed yet" -- done lazily in _checkre2
    _re2 = None
except ImportError:
    _re2 = False
2188
2202
2189
2203
class _re(object):
    """Facade over the stdlib ``re`` module that transparently prefers
    the faster ``re2`` engine when it is installed and the pattern/flags
    are compatible with it."""

    def _checkre2(self):
        # probe whether the installed re2 module actually works and what
        # string type it expects; records the result in module globals
        global _re2
        global _re2_input

        check_pattern = br'\[([^\[]+)\]'
        check_input = b'[ui]'
        try:
            # check if match works, see issue3964
            _re2 = bool(re2.match(check_pattern, check_input))
        except ImportError:
            _re2 = False
        except TypeError:
            # the `pyre-2` project provides a re2 module that accept bytes
            # the `fb-re2` project provides a re2 module that acccept sysstr
            check_pattern = pycompat.sysstr(check_pattern)
            check_input = pycompat.sysstr(check_input)
            _re2 = bool(re2.match(check_pattern, check_input))
            _re2_input = pycompat.sysstr

    def compile(self, pat, flags=0):
        """Compile a regular expression, using re2 if possible

        For best performance, use only re2-compatible regexp features. The
        only flags from the re module that are re2-compatible are
        IGNORECASE and MULTILINE."""
        if _re2 is None:
            self._checkre2()
        if _re2 and (flags & ~(remod.IGNORECASE | remod.MULTILINE)) == 0:
            # re2 takes inline flags instead of a flags argument
            if flags & remod.IGNORECASE:
                pat = b'(?i)' + pat
            if flags & remod.MULTILINE:
                pat = b'(?m)' + pat
            try:
                return re2.compile(_re2_input(pat))
            except re2.error:
                # pattern uses a feature re2 lacks: fall back to stdlib re
                pass
        return remod.compile(pat, flags)

    @propertycache
    def escape(self):
        """Return the version of escape corresponding to self.compile.

        This is imperfect because whether re2 or re is used for a particular
        function depends on the flags, etc, but it's the best we can do.
        """
        global _re2
        if _re2 is None:
            self._checkre2()
        if _re2:
            return re2.escape
        else:
            return remod.escape
2243
2257
2244
2258
# module-level singleton used as a drop-in replacement for the stdlib re
re = _re()

# cache of {directory: {normcased name: on-disk name}} used by fspath()
_fspathcache = {}
2248
2262
2249
2263
def fspath(name, root):
    # type: (bytes, bytes) -> bytes
    """Get name in the case stored in the filesystem

    The name should be relative to root, and be normcase-ed for efficiency.

    Note that this function is unnecessary, and should not be
    called, for case-sensitive filesystems (simply because it's expensive).

    The root should be normcase-ed, too.
    """

    def _makefspathcacheentry(dir):
        # map normcased entry name -> on-disk entry name
        return {normcase(n): n for n in os.listdir(dir)}

    seps = pycompat.ossep
    if pycompat.osaltsep:
        seps = seps + pycompat.osaltsep
    # Protect backslashes. This gets silly very quickly.
    # NOTE(review): the replace() result is discarded, so this line is a
    # no-op as written -- verify whether it should be `seps = seps.replace(...)`
    seps.replace(b'\\', b'\\\\')
    pattern = remod.compile(br'([^%s]+)|([%s]+)' % (seps, seps))
    dir = os.path.normpath(root)
    result = []
    for part, sep in pattern.findall(name):
        if sep:
            # separator runs pass through unchanged
            result.append(sep)
            continue

        if dir not in _fspathcache:
            _fspathcache[dir] = _makefspathcacheentry(dir)
        contents = _fspathcache[dir]

        found = contents.get(part)
        if not found:
            # retry "once per directory" per "dirstate.walk" which
            # may take place for each patches of "hg qpush", for example
            _fspathcache[dir] = contents = _makefspathcacheentry(dir)
            found = contents.get(part)

        result.append(found or part)
        dir = os.path.join(dir, part)

    return b''.join(result)
2293
2307
2294
2308
def checknlink(testfile):
    # type: (bytes) -> bool
    """check whether hardlink count reporting works properly

    Creates and removes a scratch file next to *testfile*, hardlinks it,
    and verifies the reported link count exceeds one.  Returns False on
    any OS error (taken to mean hardlinks cannot be relied upon here).
    """

    # testfile may be open, so we need a separate file for checking to
    # work around issue2543 (or testfile may get lost on Samba shares)
    f1, f2, fp = None, None, None
    try:
        fd, f1 = pycompat.mkstemp(
            prefix=b'.%s-' % os.path.basename(testfile),
            suffix=b'1~',
            dir=os.path.dirname(testfile),
        )
        os.close(fd)
        # derive the link name from the temp name (swap the 1~ suffix)
        f2 = b'%s2~' % f1[:-2]

        oslink(f1, f2)
        # nlinks() may behave differently for files on Windows shares if
        # the file is open.
        fp = posixfile(f2)
        return nlinks(f2) > 1
    except OSError:
        return False
    finally:
        # best-effort cleanup of both scratch files
        if fp is not None:
            fp.close()
        for f in (f1, f2):
            try:
                if f is not None:
                    os.unlink(f)
            except OSError:
                pass
2327
2341
2328
2342
def endswithsep(path):
    # type: (bytes) -> bool
    """Return True if ``path`` ends with os.sep or os.altsep."""
    if path.endswith(pycompat.ossep):
        return True
    altsep = pycompat.osaltsep
    # altsep may be empty/None on platforms with a single separator
    return bool(altsep and path.endswith(altsep))
2337
2351
2338
2352
def splitpath(path):
    # type: (bytes) -> List[bytes]
    """Split path by os.sep.
    Note that this function does not use os.altsep because this is
    an alternative of simple "xxx.split(os.sep)".
    It is recommended to use os.path.normpath() before using this
    function if need."""
    return path.split(pycompat.ossep)
2347
2361
2348
2362
def mktempcopy(name, emptyok=False, createmode=None, enforcewritable=False):
    """Create a temporary file with the same contents from name

    The permission bits are copied from the original file.

    If the temporary file is going to be truncated immediately, you
    can use emptyok=True as an optimization.

    Returns the name of the temporary file.
    """
    d, fn = os.path.split(name)
    fd, temp = pycompat.mkstemp(prefix=b'.%s-' % fn, suffix=b'~', dir=d)
    os.close(fd)
    # Temporary files are created with mode 0600, which is usually not
    # what we want. If the original file already exists, just copy
    # its mode. Otherwise, manually obey umask.
    copymode(name, temp, createmode, enforcewritable)

    if emptyok:
        return temp
    try:
        try:
            ifp = posixfile(name, b"rb")
        except IOError as inst:
            if inst.errno == errno.ENOENT:
                # original does not exist: the (empty) temp file is a
                # faithful copy
                return temp
            # decorate the error with the filename for better reporting
            if not getattr(inst, 'filename', None):
                inst.filename = name
            raise
        ofp = posixfile(temp, b"wb")
        for chunk in filechunkiter(ifp):
            ofp.write(chunk)
        ifp.close()
        ofp.close()
    except:  # re-raises
        # never leave a partial temp file behind
        try:
            os.unlink(temp)
        except OSError:
            pass
        raise
    return temp
2390
2404
2391
2405
class filestat(object):
    """Help to exactly detect change of a file.

    The 'stat' attribute holds the result of 'os.stat()' when the given
    path exists, and None otherwise.  This lets clients skip a separate
    'exists()' check before constructing an instance.
    """

    def __init__(self, stat):
        self.stat = stat

    @classmethod
    def frompath(cls, path):
        """Build a filestat from a path; missing files yield stat=None."""
        try:
            st = os.stat(path)
        except OSError as err:
            if err.errno != errno.ENOENT:
                raise
            st = None
        return cls(st)

    @classmethod
    def fromfp(cls, fp):
        """Build a filestat from an open file object."""
        return cls(os.fstat(fp.fileno()))

    __hash__ = object.__hash__

    def __eq__(self, old):
        try:
            # Provided timestamp ambiguity has been avoided elsewhere,
            # comparing size, ctime and mtime is enough to exactly detect
            # a change of a file regardless of platform.
            return (
                self.stat.st_size == old.stat.st_size
                and self.stat[stat.ST_CTIME] == old.stat[stat.ST_CTIME]
                and self.stat[stat.ST_MTIME] == old.stat[stat.ST_MTIME]
            )
        except AttributeError:
            pass
        try:
            # two non-existent files compare equal
            return self.stat is None and old.stat is None
        except AttributeError:
            return False

    def isambig(self, old):
        """Examine whether new (= self) stat is ambiguous against old one

        "S[N]" below means stat of a file at N-th change:

        - S[n-1].ctime < S[n].ctime: can detect change of a file
        - S[n-1].ctime == S[n].ctime
          - S[n-1].ctime < S[n].mtime: means natural advancing (*1)
          - S[n-1].ctime == S[n].mtime: is ambiguous (*2)
          - S[n-1].ctime > S[n].mtime: never occurs naturally (don't care)
        - S[n-1].ctime > S[n].ctime: never occurs naturally (don't care)

        Case (*2) means the file changed twice or more within the same
        second, making timestamp comparison ambiguous.  Advancing mtime
        by one second only in case (*2) is not sufficient, because a
        naturally advanced S[n].mtime in case (*1) might collide with a
        manually advanced earlier mtime.  Therefore every
        "S[n-1].ctime == S[n].ctime" situation is treated as ambiguous,
        regardless of mtime, so "advance mtime if isambig(oldstat)"
        guarantees "S[n-1].mtime != S[n].mtime" even for unchanged sizes.
        """
        try:
            return self.stat[stat.ST_CTIME] == old.stat[stat.ST_CTIME]
        except AttributeError:
            return False

    def avoidambig(self, path, old):
        """Change file stat of specified path to avoid ambiguity.

        'old' should be the previous filestat of 'path'.

        Returns False (skipping the adjustment) when the process lacks
        the privileges needed to touch 'path'; True otherwise, meaning
        "ambiguity is avoided".
        """
        advanced = (old.stat[stat.ST_MTIME] + 1) & 0x7FFFFFFF
        try:
            os.utime(path, (advanced, advanced))
        except OSError as inst:
            if inst.errno != errno.EPERM:
                raise
            # utime() on a file created by another user raises EPERM
            # when the process lacks appropriate privileges
            return False
        return True

    def __ne__(self, other):
        return not (self == other)
2496
2510
2497
2511
class atomictempfile(object):
    """writable file object that atomically updates a file

    All writes will go to a temporary copy of the original file. Call
    close() when you are done writing, and atomictempfile will rename
    the temporary copy to the original name, making the changes
    visible. If the object is destroyed without being closed, all your
    writes are discarded.

    checkambig argument of constructor is used with filestat, and is
    useful only if target file is guarded by any lock (e.g. repo.lock
    or repo.wlock).
    """

    def __init__(self, name, mode=b'w+b', createmode=None, checkambig=False):
        self.__name = name  # permanent name
        # The temp file is only pre-filled with the original content when
        # the mode allows reading it back (no b'w'); for pure write modes
        # copying would be wasted work (emptyok).
        self._tempname = mktempcopy(
            name,
            emptyok=(b'w' in mode),
            createmode=createmode,
            enforcewritable=(b'w' in mode),
        )

        self._fp = posixfile(self._tempname, mode)
        self._checkambig = checkambig

        # delegated methods
        self.read = self._fp.read
        self.write = self._fp.write
        self.seek = self._fp.seek
        self.tell = self._fp.tell
        self.fileno = self._fp.fileno

    def close(self):
        # Commit: rename the temp file over the target, optionally fixing
        # up timestamps so change detection (see filestat.isambig) is not
        # fooled by an unchanged ctime.
        if not self._fp.closed:
            self._fp.close()
            filename = localpath(self.__name)
            oldstat = self._checkambig and filestat.frompath(filename)
            if oldstat and oldstat.stat:
                rename(self._tempname, filename)
                newstat = filestat.frompath(filename)
                if newstat.isambig(oldstat):
                    # stat of changed file is ambiguous to original one
                    advanced = (oldstat.stat[stat.ST_MTIME] + 1) & 0x7FFFFFFF
                    os.utime(filename, (advanced, advanced))
            else:
                rename(self._tempname, filename)

    def discard(self):
        # Abort: throw away the temporary file without touching the target.
        if not self._fp.closed:
            try:
                os.unlink(self._tempname)
            except OSError:
                pass
            self._fp.close()

    def __del__(self):
        if safehasattr(self, '_fp'):  # constructor actually did something
            self.discard()

    def __enter__(self):
        return self

    def __exit__(self, exctype, excvalue, traceback):
        # commit on clean exit, discard if an exception escaped the block
        if exctype is not None:
            self.discard()
        else:
            self.close()
2566
2580
2567
2581
def unlinkpath(f, ignoremissing=False, rmdir=True):
    # type: (bytes, bool, bool) -> None
    """unlink and remove the directory if it is empty"""
    if ignoremissing:
        tryunlink(f)
    else:
        unlink(f)
    if not rmdir:
        return
    # try removing directories that might now be empty
    try:
        removedirs(os.path.dirname(f))
    except OSError:
        pass
2581
2595
2582
2596
def tryunlink(f):
    # type: (bytes) -> None
    """Attempt to remove a file, ignoring ENOENT errors."""
    try:
        unlink(f)
    except OSError as err:
        # a missing file is fine; anything else is a real error
        if err.errno == errno.ENOENT:
            return
        raise
2591
2605
2592
2606
def makedirs(name, mode=None, notindexed=False):
    # type: (bytes, Optional[int], bool) -> None
    """recursive directory creation with parent mode inheritance

    Newly created directories are marked as "not to be indexed by
    the content indexing service", if ``notindexed`` is specified
    for "write" mode access.
    """
    try:
        makedir(name, notindexed)
    except OSError as err:
        if err.errno == errno.EEXIST:
            return
        if err.errno != errno.ENOENT or not name:
            raise
        parent = os.path.dirname(os.path.abspath(name))
        if parent == name:
            # reached the filesystem root without succeeding
            raise
        # missing parent: create the ancestors first, then retry
        makedirs(parent, mode, notindexed)
        try:
            makedir(name, notindexed)
        except OSError as err:
            # EEXIST here means we lost a race with a concurrent creator
            if err.errno != errno.EEXIST:
                raise
            return
    if mode is not None:
        os.chmod(name, mode)
2621
2635
2622
2636
def readfile(path):
    # type: (bytes) -> bytes
    """Return the entire content of the file at ``path`` as bytes."""
    with open(path, b'rb') as fh:
        return fh.read()
2627
2641
2628
2642
def writefile(path, text):
    # type: (bytes, bytes) -> None
    """Replace the content of the file at ``path`` with ``text``."""
    with open(path, b'wb') as fh:
        fh.write(text)
2633
2647
2634
2648
def appendfile(path, text):
    # type: (bytes, bytes) -> None
    """Append ``text`` to the end of the file at ``path``."""
    with open(path, b'ab') as fh:
        fh.write(text)
2639
2653
2640
2654
class chunkbuffer(object):
    """Allow arbitrary sized chunks of data to be efficiently read from an
    iterator over chunks of arbitrary size."""

    def __init__(self, in_iter):
        """in_iter is the iterator that's iterating over the input chunks."""

        def splitbig(chunks):
            # Re-chunk oversized (> 1 MiB) input into 256 KiB pieces so a
            # single huge chunk cannot dominate memory held in the queue.
            for chunk in chunks:
                if len(chunk) > 2 ** 20:
                    pos = 0
                    while pos < len(chunk):
                        end = pos + 2 ** 18
                        yield chunk[pos:end]
                        pos = end
                else:
                    yield chunk

        self.iter = splitbig(in_iter)
        self._queue = collections.deque()
        # read position within the chunk at the head of the queue
        self._chunkoffset = 0

    def read(self, l=None):
        """Read L bytes of data from the iterator of chunks of data.
        Returns less than L bytes if the iterator runs dry.

        If size parameter is omitted, read everything"""
        if l is None:
            return b''.join(self.iter)

        left = l
        buf = []
        queue = self._queue
        while left > 0:
            # refill the queue with roughly 256 KiB of buffered chunks
            if not queue:
                target = 2 ** 18
                for chunk in self.iter:
                    queue.append(chunk)
                    target -= len(chunk)
                    if target <= 0:
                        break
                if not queue:
                    break

            # The easy way to do this would be to queue.popleft(), modify the
            # chunk (if necessary), then queue.appendleft(). However, for cases
            # where we read partial chunk content, this incurs 2 dequeue
            # mutations and creates a new str for the remaining chunk in the
            # queue. Our code below avoids this overhead.

            chunk = queue[0]
            chunkl = len(chunk)
            offset = self._chunkoffset

            # Use full chunk.
            if offset == 0 and left >= chunkl:
                left -= chunkl
                queue.popleft()
                buf.append(chunk)
                # self._chunkoffset remains at 0.
                continue

            chunkremaining = chunkl - offset

            # Use all of unconsumed part of chunk.
            if left >= chunkremaining:
                left -= chunkremaining
                queue.popleft()
                # offset == 0 is enabled by block above, so this won't merely
                # copy via ``chunk[0:]``.
                buf.append(chunk[offset:])
                self._chunkoffset = 0

            # Partial chunk needed.
            else:
                buf.append(chunk[offset : offset + left])
                self._chunkoffset += left
                # left goes negative here, which terminates the loop
                left -= chunkremaining

        return b''.join(buf)
2722
2736
2723
2737
def filechunkiter(f, size=131072, limit=None):
    """Yield the data in file-like object ``f`` as a series of chunks.

    Chunks are ``size`` bytes (default 131072) at a time, up to the
    optional ``limit`` total bytes (default: read all data).  A chunk
    may be shorter than ``size`` when it is the last one in the file,
    or when ``f`` is a socket or some other kind of file object that
    sometimes returns less data than requested.
    """
    assert size >= 0
    assert limit is None or limit >= 0
    while True:
        nbytes = size if limit is None else min(limit, size)
        data = nbytes and f.read(nbytes)
        if not data:
            break
        if limit:
            limit -= len(data)
        yield data
2744
2758
2745
2759
class cappedreader(object):
    """A file object proxy that allows reading up to N bytes.

    Given a source file object, instances of this type allow reading up
    to N bytes from it.  Attempts to read past the allowed limit behave
    as if EOF had been reached.

    The wrapped file object must not be read from directly while this
    proxy is in use; otherwise the internal byte accounting gets out of
    sync and the results are undefined.
    """

    def __init__(self, fh, limit):
        """Allow reading up to <limit> bytes from <fh>."""
        self._fh = fh
        self._left = limit

    def read(self, n=-1):
        remaining = self._left
        if not remaining:
            return b''

        if n < 0:
            n = remaining

        data = self._fh.read(min(n, remaining))
        self._left = remaining - len(data)
        assert self._left >= 0

        return data

    def readinto(self, b):
        res = self.read(len(b))
        if res is None:
            return None

        b[0 : len(res)] = res
        return len(res)
2783
2797
2784
2798
def unitcountfn(*unittable):
    """Return a function that renders a readable count of some quantity.

    ``unittable`` is a sequence of ``(multiplier, divisor, format)``
    triples tried in order; the first one whose threshold
    (``divisor * multiplier``) does not exceed ``abs(count)`` is used.
    The last entry acts as the fallback for small counts.
    """

    def render(count):
        for multiplier, divisor, fmt in unittable:
            if abs(count) >= divisor * multiplier:
                return fmt % (count / float(divisor))
        # nothing matched: fall back to the smallest-unit format
        return unittable[-1][2] % count

    return render
2795
2809
2796
2810
def processlinerange(fromline, toline):
    # type: (int, int) -> Tuple[int, int]
    """Check that linerange <fromline>:<toline> makes sense and return a
    0-based range.

    >>> processlinerange(10, 20)
    (9, 20)
    >>> processlinerange(2, 1)
    Traceback (most recent call last):
        ...
    ParseError: line range must be positive
    >>> processlinerange(0, 5)
    Traceback (most recent call last):
        ...
    ParseError: fromline must be strictly positive
    """
    if toline < fromline:
        raise error.ParseError(_(b"line range must be positive"))
    if fromline < 1:
        raise error.ParseError(_(b"fromline must be strictly positive"))
    # callers use 1-based inclusive ranges; convert to 0-based half-open
    return fromline - 1, toline
2818
2832
2819
2833
# Render a byte count with the most readable unit suffix (GB/MB/KB/bytes).
# Each (multiplier, divisor, format) triple is tried in order from the
# largest unit down; the final entry is the fallback for small values.
bytecount = unitcountfn(
    (100, 1 << 30, _(b'%.0f GB')),
    (10, 1 << 30, _(b'%.1f GB')),
    (1, 1 << 30, _(b'%.2f GB')),
    (100, 1 << 20, _(b'%.0f MB')),
    (10, 1 << 20, _(b'%.1f MB')),
    (1, 1 << 20, _(b'%.2f MB')),
    (100, 1 << 10, _(b'%.0f KB')),
    (10, 1 << 10, _(b'%.1f KB')),
    (1, 1 << 10, _(b'%.2f KB')),
    (1, 1, _(b'%.0f bytes')),
)
2832
2846
2833
2847
class transformingwriter(object):
    """Writable file wrapper that filters written data through a function.

    Every chunk passed to write() is run through ``encode`` before being
    handed to the underlying file object ``fp``.
    """

    def __init__(self, fp, encode):
        self._fp = fp
        self._encode = encode

    def write(self, data):
        return self._fp.write(self._encode(data))

    def flush(self):
        self._fp.flush()

    def close(self):
        self._fp.close()
2849
2863
2850
2864
# Matches a single EOL which can either be a CRLF where repeated CR
# are removed or a LF. We do not care about old Macintosh files, so a
# stray CR is an error.
_eolre = remod.compile(br'\r*\n')


def tolf(s):
    # type: (bytes) -> bytes
    """Normalize all line endings in ``s`` to LF."""
    return _eolre.sub(b'\n', s)


def tocrlf(s):
    # type: (bytes) -> bytes
    """Normalize all line endings in ``s`` to CRLF."""
    return _eolre.sub(b'\r\n', s)


def _crlfwriter(fp):
    """Wrap ``fp`` so that written data ends up with CRLF line endings."""
    return transformingwriter(fp, tocrlf)
2869
2883
2870
2884
# Select EOL conversion helpers matching the host platform's native line
# separator: when os.linesep is CRLF (Windows), conversion is needed in
# both directions; elsewhere the native format is already LF, so the
# identity function suffices.
if pycompat.oslinesep == b'\r\n':
    tonativeeol = tocrlf
    fromnativeeol = tolf
    nativeeolwriter = _crlfwriter
else:
    tonativeeol = pycompat.identity
    fromnativeeol = pycompat.identity
    nativeeolwriter = pycompat.identity
2879
2893
if pyplatform.python_implementation() == b'CPython' and sys.version_info < (
    3,
    0,
):
    # There is an issue in CPython that some IO methods do not handle EINTR
    # correctly. The following table shows what CPython version (and functions)
    # are affected (buggy: has the EINTR bug, okay: otherwise):
    #
    #                | < 2.7.4 | 2.7.4 to 2.7.12 | >= 3.0
    #   --------------------------------------------------
    #    fp.__iter__ | buggy   | buggy           | okay
    #    fp.read*    | buggy   | okay [1]        | okay
    #
    # [1]: fixed by changeset 67dc99a989cd in the cpython hg repo.
    #
    # Here we workaround the EINTR issue for fileobj.__iter__. Other methods
    # like "read*" work fine, as we do not support Python < 2.7.4.
    #
    # Although we can workaround the EINTR issue for fp.__iter__, it is slower:
    # "for x in fp" is 4x faster than "for x in iter(fp.readline, '')" in
    # CPython 2, because CPython 2 maintains an internal readahead buffer for
    # fp.__iter__ but not other fp.read* methods.
    #
    # On modern systems like Linux, the "read" syscall cannot be interrupted
    # when reading "fast" files like on-disk files. So the EINTR issue only
    # affects things like pipes, sockets, ttys etc. We treat "normal" (S_ISREG)
    # files approximately as "fast" files and use the fast (unsafe) code path,
    # to minimize the performance impact.

    def iterfile(fp):
        """Return an iterator over ``fp`` that tolerates EINTR (CPython 2)."""
        fastpath = True
        if type(fp) is file:
            # regular on-disk files are treated as "fast" and can use the
            # quicker (but EINTR-unsafe) native iteration
            fastpath = stat.S_ISREG(os.fstat(fp.fileno()).st_mode)
        if fastpath:
            return fp
        else:
            # fp.readline deals with EINTR correctly, use it as a workaround.
            return iter(fp.readline, b'')


else:
    # PyPy and CPython 3 do not have the EINTR issue thus no workaround needed.
    def iterfile(fp):
        """Return ``fp`` itself; iteration is EINTR-safe on this Python."""
        return fp
2924
2938
2925
2939
def iterlines(iterator):
    # type: (Iterator[bytes]) -> Iterator[bytes]
    """Yield every line of every chunk produced by ``iterator``.

    Chunk boundaries are ignored: each chunk is split on universal line
    endings (via ``bytes.splitlines``) and its lines are emitted one at
    a time, without the line-ending characters.
    """
    for piece in iterator:
        for segment in piece.splitlines():
            yield segment
2931
2945
2932
2946
def expandpath(path):
    # type: (bytes) -> bytes
    """Expand environment variables, then ``~``/``~user``, in ``path``."""
    withvars = os.path.expandvars(path)
    return os.path.expanduser(withvars)
2936
2950
2937
2951
def interpolate(prefix, mapping, s, fn=None, escape_prefix=False):
    """Return the result of interpolating items in the mapping into string s.

    prefix is a single character string, or a two character string with
    a backslash as the first character if the prefix needs to be escaped in
    a regular expression.

    fn is an optional function that will be applied to the replacement text
    just before replacement.

    escape_prefix is an optional flag that allows using doubled prefix for
    its escaping.
    """
    fn = fn or (lambda s: s)
    patterns = b'|'.join(mapping.keys())
    if escape_prefix:
        patterns += b'|' + prefix
        if len(prefix) > 1:
            prefix_char = prefix[1:]
        else:
            prefix_char = prefix
        # Register the (doubled) prefix as replacing itself. Work on a copy
        # so the extra key is not leaked back into the caller's mapping,
        # which the previous implementation mutated in place.
        mapping = dict(mapping)
        mapping[prefix_char] = prefix_char
    r = remod.compile(br'%s(%s)' % (prefix, patterns))
    return r.sub(lambda x: fn(mapping[x.group()[1:]]), s)
2962
2976
2963
2977
def getport(*args, **kwargs):
    """Deprecated shim; forwards to mercurial.utils.urlutil.getport()."""
    nouideprecwarn(
        b'getport(...) moved to mercurial.utils.urlutil', b'6.0', stacklevel=2
    )
    return urlutil.getport(*args, **kwargs)
2968
2982
2969
2983
def url(*args, **kwargs):
    """Deprecated shim; forwards to mercurial.utils.urlutil.url()."""
    nouideprecwarn(
        b'url(...) moved to mercurial.utils.urlutil', b'6.0', stacklevel=2
    )
    return urlutil.url(*args, **kwargs)
2974
2988
2975
2989
def hasscheme(*args, **kwargs):
    """Deprecated shim; forwards to mercurial.utils.urlutil.hasscheme()."""
    nouideprecwarn(
        b'hasscheme(...) moved to mercurial.utils.urlutil', b'6.0', stacklevel=2
    )
    return urlutil.hasscheme(*args, **kwargs)
2980
2994
2981
2995
def hasdriveletter(*args, **kwargs):
    """Deprecated shim; forwards to mercurial.utils.urlutil.hasdriveletter()."""
    nouideprecwarn(
        b'hasdriveletter(...) moved to mercurial.utils.urlutil',
        b'6.0',
        stacklevel=2,
    )
    return urlutil.hasdriveletter(*args, **kwargs)
2986
3000
2987
3001
def urllocalpath(*args, **kwargs):
    """Deprecated shim; forwards to mercurial.utils.urlutil.urllocalpath()."""
    nouideprecwarn(
        b'urllocalpath(...) moved to mercurial.utils.urlutil',
        b'6.0',
        stacklevel=2,
    )
    return urlutil.urllocalpath(*args, **kwargs)
2992
3006
2993
3007
def checksafessh(*args, **kwargs):
    """Deprecated shim; forwards to mercurial.utils.urlutil.checksafessh()."""
    nouideprecwarn(
        b'checksafessh(...) moved to mercurial.utils.urlutil',
        b'6.0',
        stacklevel=2,
    )
    return urlutil.checksafessh(*args, **kwargs)
2998
3012
2999
3013
def hidepassword(*args, **kwargs):
    """Deprecated shim; forwards to mercurial.utils.urlutil.hidepassword()."""
    nouideprecwarn(
        b'hidepassword(...) moved to mercurial.utils.urlutil',
        b'6.0',
        stacklevel=2,
    )
    return urlutil.hidepassword(*args, **kwargs)
3004
3018
3005
3019
def removeauth(*args, **kwargs):
    """Deprecated shim; forwards to mercurial.utils.urlutil.removeauth()."""
    nouideprecwarn(
        b'removeauth(...) moved to mercurial.utils.urlutil',
        b'6.0',
        stacklevel=2,
    )
    return urlutil.removeauth(*args, **kwargs)
3010
3024
3011
3025
# Format a duration given in seconds, picking a unit (s/ms/us/ns) and a
# precision appropriate to its magnitude. Each entry is a
# (threshold, divisor, format) triple; presumably unitcountfn tries them in
# order and uses the first matching one -- see unitcountfn for the exact
# selection rule.
timecount = unitcountfn(
    (1, 1e3, _(b'%.0f s')),
    (100, 1, _(b'%.1f s')),
    (10, 1, _(b'%.2f s')),
    (1, 1, _(b'%.3f s')),
    (100, 0.001, _(b'%.1f ms')),
    (10, 0.001, _(b'%.2f ms')),
    (1, 0.001, _(b'%.3f ms')),
    (100, 0.000001, _(b'%.1f us')),
    (10, 0.000001, _(b'%.2f us')),
    (1, 0.000001, _(b'%.3f us')),
    (100, 0.000000001, _(b'%.1f ns')),
    (10, 0.000000001, _(b'%.2f ns')),
    (1, 0.000000001, _(b'%.3f ns')),
)
3027
3041
3028
3042
@attr.s
class timedcmstats(object):
    """Stats information produced by the timedcm context manager on entering."""

    # Timer value captured when the instance is created, as a float. The
    # meaning and resolution are platform dependent (see util.timer).
    start = attr.ib(default=attr.Factory(lambda: timer()))
    # Elapsed time in seconds as a float; stays 0 until the context exits.
    elapsed = attr.ib(default=0)
    # Nesting depth of active timedcm context managers.
    level = attr.ib(default=1)

    def __bytes__(self):
        if self.elapsed:
            return timecount(self.elapsed)
        return b'<unknown>'

    __str__ = encoding.strmethod(__bytes__)
3046
3060
3047
3061
@contextlib.contextmanager
def timedcm(whencefmt, *whenceargs):
    """A context manager that produces timing information for a given context.

    On entering a timedcmstats instance is produced.

    This context manager is reentrant.

    """
    # Bump the nesting counter first so nested uses report their depth.
    timedcm._nested += 1
    stats = timedcmstats(level=timedcm._nested)
    try:
        with tracing.log(whencefmt, *whenceargs):
            yield stats
    finally:
        # Record the elapsed time even if the body raised.
        stats.elapsed = timer() - stats.start
        timedcm._nested -= 1


# module-level nesting counter consumed by timedcm above
timedcm._nested = 0
3069
3083
3070
3084
def timed(func):
    """Report the execution time of a function call to stderr.

    During development, use as a decorator when you need to measure
    the cost of a function, e.g. as follows:

    @util.timed
    def foo(a, b, c):
        pass
    """

    def wrapper(*args, **kwargs):
        fname = pycompat.bytestr(func.__name__)
        with timedcm(fname) as time_stats:
            result = func(*args, **kwargs)
        # Indent proportionally to the nesting level of timed calls.
        indent = b' ' * time_stats.level * 2
        procutil.stderr.write(b'%s%s: %s\n' % (indent, fname, time_stats))
        return result

    return wrapper
3097
3111
3098
3112
# Size suffixes understood by sizetoint(), each mapped to its multiplier in
# bytes. sizetoint() probes these with bytes.endswith() in declaration
# order, so the bare b'b' entry must stay last: placed earlier it would
# also match the b'kb'/b'mb'/b'gb' spellings.
_sizeunits = (
    (b'm', 2 ** 20),
    (b'k', 2 ** 10),
    (b'g', 2 ** 30),
    (b'kb', 2 ** 10),
    (b'mb', 2 ** 20),
    (b'gb', 2 ** 30),
    (b'b', 1),
)
3108
3122
3109
3123
def sizetoint(s):
    # type: (bytes) -> int
    """Convert a space specifier to a byte count.

    >>> sizetoint(b'30')
    30
    >>> sizetoint(b'2.2kb')
    2252
    >>> sizetoint(b'6M')
    6291456
    """
    spec = s.strip().lower()
    try:
        for suffix, scale in _sizeunits:
            if spec.endswith(suffix):
                # Allow fractional values like b'2.2kb'; truncate to int.
                return int(float(spec[: -len(suffix)]) * scale)
        # No recognized suffix: the whole specifier must be an integer.
        return int(spec)
    except ValueError:
        raise error.ParseError(_(b"couldn't parse size: %s") % s)
3129
3143
3130
3144
class hooks(object):
    """A collection of hook functions that can be used to extend a
    function's behavior. Hooks are called in lexicographic order,
    based on the names of their sources."""

    def __init__(self):
        # list of (source, callable) pairs, sorted lazily on invocation
        self._hooks = []

    def add(self, source, hook):
        self._hooks.append((source, hook))

    def __call__(self, *args):
        # Order the hooks by source name before running them, so the call
        # order is deterministic regardless of registration order.
        self._hooks.sort(key=lambda entry: entry[0])
        return [hook(*args) for _source, hook in self._hooks]
3148
3162
3149
3163
def getstackframes(skip=0, line=b' %-*s in %s\n', fileline=b'%s:%d', depth=0):
    """Yields lines for a nicely formatted stacktrace.
    Skips the 'skip' last entries, then return the last 'depth' entries.
    Each file+linenumber is formatted according to fileline.
    Each line is formatted according to line.
    If line is None, it yields:
        length of longest filepath+line number,
        filepath+linenumber,
        function

    Not be used in production code but very convenient while developing.
    """
    # Drop this function's own frame plus the requested number of callers.
    frames = traceback.extract_stack()[: -skip - 1]
    entries = [
        (fileline % (pycompat.sysbytes(fn), ln), pycompat.sysbytes(func))
        for fn, ln, func, _text in frames
    ]
    # depth == 0 keeps everything: [-0:] slices the whole list.
    entries = entries[-depth:]
    if not entries:
        return
    fnmax = max(len(entry[0]) for entry in entries)
    for fnln, func in entries:
        if line is None:
            yield (fnmax, fnln, func)
        else:
            yield line % (fnmax, fnln, func)
3173
3187
3174
3188
def debugstacktrace(
    msg=b'stacktrace',
    skip=0,
    f=procutil.stderr,
    otherf=procutil.stdout,
    depth=0,
    prefix=b'',
):
    """Writes a message to f (stderr) with a nicely formatted stacktrace.
    Skips the 'skip' entries closest to the call, then show 'depth' entries.
    By default it will flush stdout first.
    It can be used everywhere and intentionally does not require an ui object.
    Not be used in production code but very convenient while developing.
    """
    if otherf:
        # Flush the companion stream first so the trace does not interleave
        # with buffered output.
        otherf.flush()
    f.write(b'%s%s at:\n' % (prefix, msg.rstrip()))
    # skip + 1 also hides this very function from the reported stack.
    for entry in getstackframes(skip + 1, depth=depth):
        f.write(prefix + entry)
    f.flush()


# convenient shortcut
dst = debugstacktrace
3199
3213
3200
3214
def safename(f, tag, ctx, others=None):
    """
    Generate a name that it is safe to rename f to in the given context.

    f: filename to rename
    tag: a string tag that will be included in the new name
    ctx: a context, in which the new name must not exist
    others: a set of other filenames that the new name must not be in

    Returns a file name of the form oldname~tag[~number] which does not exist
    in the provided context and is not in the set of other names.
    """
    if others is None:
        others = set()

    fn = b'%s~%s' % (f, tag)
    if fn not in ctx and fn not in others:
        return fn
    for n in itertools.count(1):
        # Use %d for the counter: under PEP 461, b'%s' rejects ints on
        # Python 3, so the previous b'%s' here made this fallback path
        # raise TypeError whenever the unnumbered name was taken.
        fn = b'%s~%s~%d' % (f, tag, n)
        if fn not in ctx and fn not in others:
            return fn
3223
3237
3224
3238
def readexactly(stream, n):
    '''read n bytes from stream.read and abort if less was available'''
    data = stream.read(n)
    if len(data) < n:
        # A short read means the stream was truncated; surface that to the
        # user instead of propagating partial data.
        raise error.Abort(
            _(b"stream ended unexpectedly (got %d bytes, expected %d)")
            % (len(data), n)
        )
    return data
3234
3248
3235
3249
def uvarintencode(value):
    """Encode an unsigned integer value to a varint.

    A varint is a variable length integer of 1 or more bytes. Each byte
    except the last has the most significant bit set. The lower 7 bits of
    each byte store the 2's complement representation, least significant group
    first.

    >>> uvarintencode(0)
    '\\x00'
    >>> uvarintencode(1)
    '\\x01'
    >>> uvarintencode(127)
    '\\x7f'
    >>> uvarintencode(1337)
    '\\xb9\\n'
    >>> uvarintencode(65536)
    '\\x80\\x80\\x04'
    >>> uvarintencode(-1)
    Traceback (most recent call last):
        ...
    ProgrammingError: negative value for uvarint: -1
    """
    if value < 0:
        raise error.ProgrammingError(b'negative value for uvarint: %d' % value)
    pieces = []
    remaining = value
    while True:
        group = remaining & 0x7F
        remaining >>= 7
        if not remaining:
            # Last group: emitted with the continuation bit clear.
            pieces.append(pycompat.bytechr(group))
            break
        pieces.append(pycompat.bytechr(0x80 | group))
    return b''.join(pieces)
3271
3285
3272
3286
def uvarintdecodestream(fh):
    """Decode an unsigned variable length integer from a stream.

    The passed argument is anything that has a ``.read(N)`` method.

    >>> try:
    ...     from StringIO import StringIO as BytesIO
    ... except ImportError:
    ...     from io import BytesIO
    >>> uvarintdecodestream(BytesIO(b'\\x00'))
    0
    >>> uvarintdecodestream(BytesIO(b'\\x01'))
    1
    >>> uvarintdecodestream(BytesIO(b'\\x7f'))
    127
    >>> uvarintdecodestream(BytesIO(b'\\xb9\\n'))
    1337
    >>> uvarintdecodestream(BytesIO(b'\\x80\\x80\\x04'))
    65536
    >>> uvarintdecodestream(BytesIO(b'\\x80'))
    Traceback (most recent call last):
        ...
    Abort: stream ended unexpectedly (got 0 bytes, expected 1)
    """
    value = 0
    # Each byte carries 7 payload bits, least significant group first.
    for shift in itertools.count(0, 7):
        byte = ord(readexactly(fh, 1))
        value |= (byte & 0x7F) << shift
        if not (byte & 0x80):
            # Continuation bit clear: this was the last group.
            return value
3305
3319
3306
3320
3307 # Passing the '' locale means that the locale should be set according to the
3321 # Passing the '' locale means that the locale should be set according to the
3308 # user settings (environment variables).
3322 # user settings (environment variables).
3309 # Python sometimes avoids setting the global locale settings. When interfacing
3323 # Python sometimes avoids setting the global locale settings. When interfacing
3310 # with C code (e.g. the curses module or the Subversion bindings), the global
3324 # with C code (e.g. the curses module or the Subversion bindings), the global
3311 # locale settings must be initialized correctly. Python 2 does not initialize
3325 # locale settings must be initialized correctly. Python 2 does not initialize
3312 # the global locale settings on interpreter startup. Python 3 sometimes
3326 # the global locale settings on interpreter startup. Python 3 sometimes
3313 # initializes LC_CTYPE, but not consistently at least on Windows. Therefore we
3327 # initializes LC_CTYPE, but not consistently at least on Windows. Therefore we
3314 # explicitly initialize it to get consistent behavior if it's not already
3328 # explicitly initialize it to get consistent behavior if it's not already
3315 # initialized. Since CPython commit 177d921c8c03d30daa32994362023f777624b10d,
3329 # initialized. Since CPython commit 177d921c8c03d30daa32994362023f777624b10d,
3316 # LC_CTYPE is always initialized. If we require Python 3.8+, we should re-check
3330 # LC_CTYPE is always initialized. If we require Python 3.8+, we should re-check
3317 # if we can remove this code.
3331 # if we can remove this code.
@contextlib.contextmanager
def with_lc_ctype():
    """Temporarily initialize LC_CTYPE from the environment if it is 'C'."""
    oldloc = locale.setlocale(locale.LC_CTYPE, None)
    if oldloc != 'C':
        # LC_CTYPE is already initialized; leave it untouched.
        yield
        return
    try:
        try:
            locale.setlocale(locale.LC_CTYPE, '')
        except locale.Error:
            # The likely case is that the locale from the environment
            # variables is unknown.
            pass
        yield
    finally:
        locale.setlocale(locale.LC_CTYPE, oldloc)
3334
3348
3335
3349
def _estimatememory():
    # type: () -> Optional[int]
    """Provide an estimate for the available system memory in Bytes.

    If no estimate can be provided on the platform, returns None.
    """
    if pycompat.sysplatform.startswith(b'win'):
        # On Windows, use the GlobalMemoryStatusEx kernel function directly.
        # Note: Structure, byref, sizeof and windll live in ``ctypes``
        # itself, not in ``ctypes.wintypes`` -- importing them from
        # wintypes raised ImportError and broke this whole branch.
        from ctypes import (
            Structure,
            byref,
            c_long as DWORD,
            c_ulonglong as DWORDLONG,
            sizeof,
            windll,
        )

        class MEMORYSTATUSEX(Structure):
            _fields_ = [
                ('dwLength', DWORD),
                ('dwMemoryLoad', DWORD),
                ('ullTotalPhys', DWORDLONG),
                ('ullAvailPhys', DWORDLONG),
                ('ullTotalPageFile', DWORDLONG),
                ('ullAvailPageFile', DWORDLONG),
                ('ullTotalVirtual', DWORDLONG),
                ('ullAvailVirtual', DWORDLONG),
                ('ullExtendedVirtual', DWORDLONG),
            ]

        x = MEMORYSTATUSEX()
        x.dwLength = sizeof(x)
        windll.kernel32.GlobalMemoryStatusEx(byref(x))
        return x.ullAvailPhys

    # On newer Unix-like systems and Mac OSX, the sysconf interface
    # can be used. _SC_PAGE_SIZE is part of POSIX; _SC_PHYS_PAGES
    # seems to be implemented on most systems.
    try:
        pagesize = os.sysconf(os.sysconf_names['SC_PAGE_SIZE'])
        pages = os.sysconf(os.sysconf_names['SC_PHYS_PAGES'])
        return pagesize * pages
    except OSError:  # sysconf can fail
        pass
    except KeyError:  # unknown parameter
        pass
General Comments 0
You need to be logged in to leave comments. Login now