upstream/mercurial-mirror Commit - r49814:9ac1a450

1

# pycompat.py - portability shim for python 3

1

# pycompat.py - portability shim for python 3

2

#

2

#

3

# This software may be used and distributed according to the terms of the

3

# This software may be used and distributed according to the terms of the

4

# GNU General Public License version 2 or any later version.

4

# GNU General Public License version 2 or any later version.

5

6

"""Mercurial portability shim for python 3.

6

"""Mercurial portability shim for python 3.

7

8

This contains aliases to hide python version-specific details from the core.

8

This contains aliases to hide python version-specific details from the core.

9

"""

9

"""

10

11

12

import builtins

12

import builtins

13

import codecs

13

import codecs

14

import concurrent.futures as futures

14

import concurrent.futures as futures

15

import functools

15

import functools

16

import getopt

16

import getopt

17

import http.client as httplib

17

import http.client as httplib

18

import http.cookiejar as cookielib

18

import http.cookiejar as cookielib

19

import inspect

19

import inspect

20

import io

20

import io

21

import json

21

import json

22

import os

22

import os

23

import pickle

23

import pickle

24

import queue

24

import queue

25

import shlex

25

import shlex

26

import socketserver

26

import socketserver

27

import struct

27

import struct

28

import sys

28

import sys

29

import tempfile

29

import tempfile

30

import xmlrpc.client as xmlrpclib

30

import xmlrpc.client as xmlrpclib

31

32

33

# Interpreter feature flags.
ispy3 = sys.version_info[0] >= 3
ispypy = '__pypy__' in sys.builtin_module_names
TYPE_CHECKING = False

# globals() is never empty at runtime, so this branch does not execute; it
# exists so that a static checker still sees the typing import.
if not globals():  # hide this from non-pytype users
    import typing

    TYPE_CHECKING = typing.TYPE_CHECKING

41

42

43

def future_set_exception_info(f, exc_info):
    """Set the first element of ``exc_info`` as the exception of future ``f``.

    Only ``exc_info[0]`` is used; any further elements are ignored.
    """
    f.set_exception(exc_info[0])

45

46

47

# Module-level alias of the builtin exception.
FileNotFoundError = builtins.FileNotFoundError

48

49

50

def identity(a):
    """Return the argument unchanged."""
    return a

52

53

54

def _rapply(f, xs):

54

def _rapply(f, xs):

55

if xs is None:

55

if xs is None:

56

# assume None means non-value of optional data

56

# assume None means non-value of optional data

57

return xs

57

return xs

58

if isinstance(xs, (list, set, tuple)):

58

if isinstance(xs, (list, set, tuple)):

59

return type(xs)(_rapply(f, x) for x in xs)

59

return type(xs)(_rapply(f, x) for x in xs)

60

if isinstance(xs, dict):

60

if isinstance(xs, dict):

61

return type(xs)((_rapply(f, k), _rapply(f, v)) for k, v in xs.items())

61

return type(xs)((_rapply(f, k), _rapply(f, v)) for k, v in xs.items())

62

return f(xs)

62

return f(xs)

63

64

65

def rapply(f, xs):
    """Apply function recursively to every item preserving the data structure

    >>> def f(x):
    ...     return 'f(%s)' % x
    >>> rapply(f, None) is None
    True
    >>> rapply(f, 'a')
    'f(a)'
    >>> rapply(f, {'a'}) == {'f(a)'}
    True
    >>> rapply(f, ['a', 'b', None, {'c': 'd'}, []])
    ['f(a)', 'f(b)', None, {'f(c)': 'f(d)'}, []]

    >>> xs = [object()]
    >>> rapply(identity, xs) is xs
    True
    """
    if f is identity:
        # fast path mainly for py2
        return xs
    return _rapply(f, xs)

87

88

89

if os.name == r'nt':
    # MBCS (or ANSI) filesystem encoding must be used as before.
    # Otherwise non-ASCII filenames in existing repositories would be
    # corrupted.
    # This must be set once prior to any fsencode/fsdecode calls.
    sys._enablelegacywindowsfsencoding()  # pytype: disable=module-attr

95

96

# Bytes versions of the os/sys string constants.
fsencode = os.fsencode
fsdecode = os.fsdecode
oscurdir = os.curdir.encode('ascii')
oslinesep = os.linesep.encode('ascii')
osname = os.name.encode('ascii')
ospathsep = os.pathsep.encode('ascii')
ospardir = os.pardir.encode('ascii')
ossep = os.sep.encode('ascii')
osaltsep = os.altsep
if osaltsep:
    # os.altsep may be None; only encode it when it is set
    osaltsep = osaltsep.encode('ascii')
osdevnull = os.devnull.encode('ascii')

sysplatform = sys.platform.encode('ascii')
sysexecutable = sys.executable
if sysexecutable:
    # left as-is (falsy) when the interpreter path is not available
    sysexecutable = os.fsencode(sysexecutable)

113

114

115

def maplist(*args):
    """Return ``map(*args)`` materialized as a list."""
    return list(map(*args))

117

118

119

def rangelist(*args):
    """Return ``range(*args)`` materialized as a list."""
    return list(range(*args))

121

122

123

def ziplist(*args):
    """Return ``zip(*args)`` materialized as a list."""
    return list(zip(*args))

125

126

127

# Python 2 style names bound to their Python 3 counterparts.
rawinput = input
getargspec = inspect.getfullargspec

long = int

131

132

# sysargv is only defined when sys.argv is present and not None.
if getattr(sys, 'argv', None) is not None:
    # On POSIX, the char** argv array is converted to Python str using
    # Py_DecodeLocale(). The inverse of this is Py_EncodeLocale(), which
    # isn't directly callable from Python code. In practice, os.fsencode()
    # can be used instead (this is recommended by Python's documentation
    # for sys.argv).
    #
    # On Windows, the wchar_t **argv is passed into the interpreter as-is.
    # Like POSIX, we need to emulate what Py_EncodeLocale() would do. But
    # there's an additional wrinkle. What we really want to access is the
    # ANSI codepage representation of the arguments, as this is what
    # `int main()` would receive if Python 3 didn't define `int wmain()`
    # (this is how Python 2 worked). To get that, we encode with the mbcs
    # encoding, which will pass CP_ACP to the underlying Windows API to
    # produce bytes.
    if os.name == r'nt':
        sysargv = [a.encode("mbcs", "ignore") for a in sys.argv]
    else:
        sysargv = [fsencode(a) for a in sys.argv]

151

152

# bytechr(i): pack one unsigned byte value into a length-1 bytes object.
bytechr = struct.Struct('>B').pack
# byterepr(x): format x through the bytes '%r' conversion.
byterepr = b'%r'.__mod__

154

155

156

class bytestr(bytes):
    """A bytes which mostly acts as a Python 2 str

    >>> bytestr(), bytestr(bytearray(b'foo')), bytestr(u'ascii'), bytestr(1)
    ('', 'foo', 'ascii', '1')
    >>> s = bytestr(b'foo')
    >>> assert s is bytestr(s)

    __bytes__() should be called if provided:

    >>> class bytesable:
    ...     def __bytes__(self):
    ...         return b'bytes'
    >>> bytestr(bytesable())
    'bytes'

    There's no implicit conversion from non-ascii str as its encoding is
    unknown:

    >>> bytestr(chr(0x80)) # doctest: +ELLIPSIS
    Traceback (most recent call last):
      ...
    UnicodeEncodeError: ...

    Comparison between bytestr and bytes should work:

    >>> assert bytestr(b'foo') == b'foo'
    >>> assert b'foo' == bytestr(b'foo')
    >>> assert b'f' in bytestr(b'foo')
    >>> assert bytestr(b'f') in b'foo'

    Sliced elements should be bytes, not integer:

    >>> s[1], s[:2]
    (b'o', b'fo')
    >>> list(s), list(reversed(s))
    ([b'f', b'o', b'o'], [b'o', b'o', b'f'])

    As bytestr type isn't propagated across operations, you need to cast
    bytes to bytestr explicitly:

    >>> s = bytestr(b'foo').upper()
    >>> t = bytestr(s)
    >>> s[0], t[0]
    (70, b'F')

    Be careful to not pass a bytestr object to a function which expects
    bytearray-like behavior.

    >>> t = bytes(t)  # cast to bytes
    >>> assert type(t) is bytes
    """

    # Trick pytype into not demanding Iterable[int] be passed to __new__(),
    # since the appropriate bytes format is done internally.
    #
    # https://github.com/google/pytype/issues/500
    if TYPE_CHECKING:

        def __init__(self, s=b''):
            pass

    def __new__(cls, s=b''):
        # an existing bytestr is returned as-is (no copy)
        if isinstance(s, bytestr):
            return s
        # anything that is neither bytes-like nor provides __bytes__ is
        # stringified and must be pure ASCII
        if not isinstance(
            s, (bytes, bytearray)
        ) and not hasattr(  # hasattr-py3-only
            s, u'__bytes__'
        ):
            s = str(s).encode('ascii')
        return bytes.__new__(cls, s)

    def __getitem__(self, key):
        s = bytes.__getitem__(self, key)
        # integer indexing yields an int; convert it to a length-1 bytes
        if not isinstance(s, bytes):
            s = bytechr(s)
        return s

    def __iter__(self):
        return iterbytestr(bytes.__iter__(self))

    def __repr__(self):
        return bytes.__repr__(self)[1:]  # drop b''

240

241

242

def iterbytestr(s):
    """Iterate bytes as if it were a str object of Python 2"""
    # each integer item is mapped to a length-1 bytes via bytechr
    return map(bytechr, s)

245

246

247

def maybebytestr(s):
    """Promote bytes to bytestr; return any other object unchanged"""
    if isinstance(s, bytes):
        return bytestr(s)
    return s

252

253

254

def sysbytes(s):
    """Convert an internal str (e.g. keyword, __doc__) back to bytes

    bytes input is returned unchanged; str input is encoded as UTF-8, which
    succeeds for any str that contains no lone surrogates. Only ASCII
    characters can be round-tripped by sysstr(sysbytes(s)).
    """
    if isinstance(s, bytes):
        return s
    return s.encode('utf-8')

263

264

265

def sysstr(s):
    """Return a keyword str to be passed to Python functions such as
    getattr() and str.encode()

    This never raises UnicodeDecodeError. Non-ascii characters are
    considered invalid and mapped to arbitrary but unique code points
    such that 'sysstr(a) != sysstr(b)' for all 'a != b'.
    """
    if isinstance(s, builtins.str):
        return s
    # latin-1 maps every byte value to exactly one code point
    return s.decode('latin-1')

276

277

278

def strurl(url):
    """Converts a bytes url back to str by decoding it as ascii

    Anything that is not bytes is returned unchanged.
    """
    if isinstance(url, bytes):
        return url.decode('ascii')
    return url

283

284

285

def bytesurl(url):
    """Converts a str url to bytes by encoding in ascii

    Anything that is not str is returned unchanged.
    """
    if isinstance(url, str):
        return url.encode('ascii')
    return url

290

291

292

def raisewithtb(exc, tb):
    """Raise exception with the given traceback"""
    raise exc.with_traceback(tb)

295

296

297

def getdoc(obj):
    """Get docstring as bytes; may be None so gettext() won't confuse it
    with _('')"""
    doc = getattr(obj, '__doc__', None)
    if doc is None:
        return doc
    return sysbytes(doc)

304

305

306

def _wrapattrfunc(f):
    """Wrap an attribute function so its name argument goes through sysstr()

    The returned wrapper calls ``f(object, sysstr(name), *args)``.
    """

    @functools.wraps(f)
    def w(object, name, *args):
        return f(object, sysstr(name), *args)

    return w

312

313

314

# these wrappers are automagically imported by hgloader

314

# these wrappers are automagically imported by hgloader

315

# Attribute helpers whose name argument is passed through sysstr(), plus
# Python 2 style aliases.
delattr = _wrapattrfunc(builtins.delattr)
getattr = _wrapattrfunc(builtins.getattr)
hasattr = _wrapattrfunc(builtins.hasattr)
setattr = _wrapattrfunc(builtins.setattr)
xrange = builtins.range
unicode = str

321

322

323

def open(name, mode=b'r', buffering=-1, encoding=None):
    """Call builtins.open() with ``mode`` converted through sysstr()"""
    return builtins.open(name, sysstr(mode), buffering, encoding)

325

326

327

# hasattr() whose attribute name is passed through sysstr()
safehasattr = _wrapattrfunc(builtins.hasattr)

328

329

330

def _getoptbwrapper(orig, args, shortlist, namelist):

330

def _getoptbwrapper(orig, args, shortlist, namelist):

331

"""

331

"""

332

Takes bytes arguments, converts them to unicode, pass them to

332

Takes bytes arguments, converts them to unicode, pass them to

333

getopt.getopt(), convert the returned values back to bytes and then

333

getopt.getopt(), convert the returned values back to bytes and then

334

return them for Python 3 compatibility as getopt.getopt() don't accepts

334

return them for Python 3 compatibility as getopt.getopt() don't accepts

335

bytes on Python 3.

335

bytes on Python 3.

336

"""

336

"""

337

args = [a.decode('latin-1') for a in args]

337

args = [a.decode('latin-1') for a in args]

338

shortlist = shortlist.decode('latin-1')

338

shortlist = shortlist.decode('latin-1')

339

namelist = [a.decode('latin-1') for a in namelist]

339

namelist = [a.decode('latin-1') for a in namelist]

340

opts, args = orig(args, shortlist, namelist)

340

opts, args = orig(args, shortlist, namelist)

341

opts = [(a[0].encode('latin-1'), a[1].encode('latin-1')) for a in opts]

341

opts = [(a[0].encode('latin-1'), a[1].encode('latin-1')) for a in opts]

342

args = [a.encode('latin-1') for a in args]

342

args = [a.encode('latin-1') for a in args]

343

return opts, args

343

return opts, args

344

345

346

def strkwargs(dic):
    """
    Converts the keys of a python dictionary to str i.e. unicodes so that
    they can be passed as keyword arguments as dictionaries with bytes keys
    can't be passed as keyword arguments to functions on Python 3.
    """
    dic = {k.decode('latin-1'): v for k, v in dic.items()}
    return dic

354

355

356

def byteskwargs(dic):
    """
    Converts keys of python dictionaries to bytes as they were converted to
    str to pass that dictionary as a keyword argument on Python 3.
    """
    dic = {k.encode('latin-1'): v for k, v in dic.items()}
    return dic

363

364

365

# TODO: handle shlex.shlex().
def shlexsplit(s, comments=False, posix=True):
    """
    Takes bytes argument, converts it to str i.e. unicodes, passes that into
    shlex.split(), converts the returned value to bytes and returns that for
    Python 3 compatibility as shlex.split() doesn't accept bytes on Python 3.
    """
    ret = shlex.split(s.decode('latin-1'), comments, posix)
    return [a.encode('latin-1') for a in ret]

374

375

376

# Python 2 style dict iteration helpers; they return the items()/values()
# view of their argument.
iteritems = lambda x: x.items()
itervalues = lambda x: x.values()

378

379

# Python 3.5's json.load and json.loads require str. We polyfill its
# code for detecting encoding from bytes.
if sys.version_info[0:2] < (3, 6):

    def _detect_encoding(b):
        """Guess the Unicode encoding name of JSON bytes ``b``

        A BOM is checked first, then the position of NUL bytes among the
        first bytes; 'utf-8' is the fallback.
        """
        bstartswith = b.startswith
        # the UTF-32 BOMs must be tested before the UTF-16 ones because
        # BOM_UTF32_LE starts with BOM_UTF16_LE
        if bstartswith((codecs.BOM_UTF32_BE, codecs.BOM_UTF32_LE)):
            return 'utf-32'
        if bstartswith((codecs.BOM_UTF16_BE, codecs.BOM_UTF16_LE)):
            return 'utf-16'
        if bstartswith(codecs.BOM_UTF8):
            return 'utf-8-sig'

        if len(b) >= 4:
            if not b[0]:
                # 00 00 -- -- - utf-32-be
                # 00 XX -- -- - utf-16-be
                return 'utf-16-be' if b[1] else 'utf-32-be'
            if not b[1]:
                # XX 00 00 00 - utf-32-le
                # XX 00 00 XX - utf-16-le
                # XX 00 XX -- - utf-16-le
                return 'utf-16-le' if b[2] or b[3] else 'utf-32-le'
        elif len(b) == 2:
            if not b[0]:
                # 00 XX - utf-16-be
                return 'utf-16-be'
            if not b[1]:
                # XX 00 - utf-16-le
                return 'utf-16-le'
        # default
        return 'utf-8'

    def json_loads(s, *args, **kwargs):
        """json.loads() that also accepts bytes/bytearray input"""
        if isinstance(s, (bytes, bytearray)):
            s = s.decode(_detect_encoding(s), 'surrogatepass')

        return json.loads(s, *args, **kwargs)


else:
    json_loads = json.loads

421

420

422

# Platform flags derived from the bytes values sysplatform and osname.
isjython = sysplatform.startswith(b'java')

isdarwin = sysplatform.startswith(b'darwin')
islinux = sysplatform.startswith(b'linux')
isposix = osname == b'posix'
iswindows = osname == b'nt'

428

427

429

428

430

def getoptb(args, shortlist, namelist):
    """Bytes interface to getopt.getopt(), via _getoptbwrapper()"""
    return _getoptbwrapper(getopt.getopt, args, shortlist, namelist)

432

431

433

432

434

def gnugetoptb(args, shortlist, namelist):
    """Bytes interface to getopt.gnu_getopt(), via _getoptbwrapper()"""
    return _getoptbwrapper(getopt.gnu_getopt, args, shortlist, namelist)

436

435

437

436

438

def mkdtemp(suffix=b'', prefix=b'tmp', dir=None):
    """Call tempfile.mkdtemp() with bytes defaults for suffix and prefix"""
    return tempfile.mkdtemp(suffix, prefix, dir)

440

439

441

440

442

# text=True is not supported; use util.from/tonativeeol() instead
def mkstemp(suffix=b'', prefix=b'tmp', dir=None):
    """Call tempfile.mkstemp() with bytes defaults for suffix and prefix"""
    return tempfile.mkstemp(suffix, prefix, dir)

445

444

446

445

447

# TemporaryFile does not support an "encoding=" argument on python2.
# Files created by this wrapper are always opened in byte mode.
def unnamedtempfile(mode=None, *args, **kwargs):
    """Call tempfile.TemporaryFile() with a binary mode

    ``mode`` defaults to 'w+b'; an explicit mode is converted through
    sysstr() and must contain 'b'.
    """
    if mode is None:
        mode = 'w+b'
    else:
        mode = sysstr(mode)
    assert 'b' in mode
    return tempfile.TemporaryFile(mode, *args, **kwargs)

456

455

457

456

458

# NamedTemporaryFile does not support an "encoding=" argument on python2.
# Files created by this wrapper are always opened in byte mode.
def namedtempfile(
    mode=b'w+b', bufsize=-1, suffix=b'', prefix=b'tmp', dir=None, delete=True
):
    """Call tempfile.NamedTemporaryFile() with a binary mode

    ``mode`` is converted through sysstr() and must contain 'b'.
    """
    mode = sysstr(mode)
    assert 'b' in mode
    return tempfile.NamedTemporaryFile(
        mode, bufsize, suffix=suffix, prefix=prefix, dir=dir, delete=delete
    )

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # pycompat.py - portability shim for python 3
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             """Mercurial portability shim for python 3.
             This contains aliases to hide python version-specific details from the core.
             """
             import builtins
             import codecs
             import concurrent.futures as futures
             import functools
             import getopt
             import http.client as httplib
             import http.cookiejar as cookielib
             import inspect
             import io
             import json
             import os
             import pickle
             import queue
             import shlex
             import socketserver
             import struct
             import sys
             import tempfile
             import xmlrpc.client as xmlrpclib
             # True when the running interpreter's major version is 3 or later.
             ispy3 = sys.version_info[0] >= 3
             # True when the interpreter ships the built-in ``__pypy__`` module.
             ispypy = '__pypy__' in sys.builtin_module_names
             # Runtime default; only replaced inside the branch below.
             TYPE_CHECKING = False
             # globals() is never empty at module scope, so this branch does not run
             # at import time; it only exists for tools that analyse the source.
             if not globals():  # hide this from non-pytype users
                 import typing
                 TYPE_CHECKING = typing.TYPE_CHECKING
             def future_set_exception_info(f, exc_info):
                 """Mark future ``f`` as failed

                 Only the first element of ``exc_info`` is used; it is handed to
                 ``f.set_exception()`` unchanged.
                 """
                 failure = exc_info[0]
                 f.set_exception(failure)
             # Re-export the builtin exception under this module's namespace.
             FileNotFoundError = builtins.FileNotFoundError
             def identity(a):
                 """Return the argument itself, untouched"""
                 return a
             def _rapply(f, xs):
                 """Recursive worker that maps ``f`` over the leaves of ``xs``

                 ``None`` is passed through. Lists, sets and tuples are rebuilt with
                 their own type, dicts are rebuilt with both keys and values mapped,
                 and anything else is treated as a leaf and given to ``f``.
                 """
                 # None stands for an absent optional value; never feed it to f
                 if xs is None:
                     return xs
                 if isinstance(xs, (list, set, tuple)):
                     rebuild = type(xs)
                     return rebuild(_rapply(f, item) for item in xs)
                 if isinstance(xs, dict):
                     rebuild = type(xs)
                     pairs = ((_rapply(f, key), _rapply(f, val)) for key, val in xs.items())
                     return rebuild(pairs)
                 return f(xs)
             def rapply(f, xs):
                 """Map ``f`` over every leaf of ``xs`` while keeping its shape

                 >>> def f(x):
                 ...     return 'f(%s)' % x
                 >>> rapply(f, None) is None
                 True
                 >>> rapply(f, 'a')
                 'f(a)'
                 >>> rapply(f, {'a'}) == {'f(a)'}
                 True
                 >>> rapply(f, ['a', 'b', None, {'c': 'd'}, []])
                 ['f(a)', 'f(b)', None, {'f(c)': 'f(d)'}, []]
                 >>> xs = [object()]
                 >>> rapply(identity, xs) is xs
                 True
                 """
                 # Applying identity cannot change anything, so skip the traversal and
                 # hand back the very same object instead of a rebuilt copy.
                 return xs if f is identity else _rapply(f, xs)
-            if os.name == r'nt' and sys.version_info >= (3, 6):
+            if os.name == r'nt':
                 # MBCS (or ANSI) filesystem encoding must be used as before.
                 # Otherwise non-ASCII filenames in existing repositories would be
                 # corrupted.
                 # This must be set once prior to any fsencode/fsdecode calls.
                 sys._enablelegacywindowsfsencoding()  # pytype: disable=module-attr
             # Filesystem-name converters, taken straight from the os module.
             fsencode = os.fsencode
             fsdecode = os.fsdecode
             # bytes copies of the os module's str constants (all encoded as ASCII).
             oscurdir = os.curdir.encode('ascii')
             oslinesep = os.linesep.encode('ascii')
             osname = os.name.encode('ascii')
             ospathsep = os.pathsep.encode('ascii')
             ospardir = os.pardir.encode('ascii')
             ossep = os.sep.encode('ascii')
             # os.altsep may be falsy; it is only encoded when it has a value.
             osaltsep = os.altsep
             if osaltsep:
                 osaltsep = osaltsep.encode('ascii')
             osdevnull = os.devnull.encode('ascii')
             sysplatform = sys.platform.encode('ascii')
             # sys.executable may be falsy; it is only converted when it has a value,
             # and uses the filesystem encoding rather than ASCII.
             sysexecutable = sys.executable
             if sysexecutable:
                 sysexecutable = os.fsencode(sysexecutable)
             def maplist(*args):
                 """Call ``map(*args)`` and return the results as a list"""
                 lazy = map(*args)
                 return list(lazy)
             def rangelist(*args):
                 """Call ``range(*args)`` and return the numbers as a list"""
                 span = range(*args)
                 return list(span)
             def ziplist(*args):
                 """Call ``zip(*args)`` and return the tuples as a list"""
                 paired = zip(*args)
                 return list(paired)
             # Extra names bound to existing Python 3 callables/types.
             # NOTE(review): these look like Python 2 spellings kept for callers.
             rawinput = input
             getargspec = inspect.getfullargspec
             long = int
             # sysargv is a bytes copy of sys.argv. It is only defined when sys.argv
             # exists and is not None.
             if getattr(sys, 'argv', None) is not None:
                 # On POSIX, the char** argv array is converted to Python str using
                 # Py_DecodeLocale(). The inverse of this is Py_EncodeLocale(), which
                 # isn't directly callable from Python code. In practice, os.fsencode()
                 # can be used instead (this is recommended by Python's documentation
                 # for sys.argv).
                 #
                 # On Windows, the wchar_t **argv is passed into the interpreter as-is.
                 # Like POSIX, we need to emulate what Py_EncodeLocale() would do. But
                 # there's an additional wrinkle. What we really want to access is the
                 # ANSI codepage representation of the arguments, as this is what
                 # `int main()` would receive if Python 3 didn't define `int wmain()`
                 # (this is how Python 2 worked). To get that, we encode with the mbcs
                 # encoding, which will pass CP_ACP to the underlying Windows API to
                 # produce bytes.
                 if os.name == r'nt':
                     # "ignore" drops characters the codec cannot encode instead of
                     # raising.
                     sysargv = [a.encode("mbcs", "ignore") for a in sys.argv]
                 else:
                     sysargv = [fsencode(a) for a in sys.argv]
             # bytechr(n): pack one unsigned-byte integer into a length-1 bytes object.
             bytechr = struct.Struct('>B').pack
             # byterepr(x): format x with %r into bytes, i.e. b'%r' % x.
             byterepr = b'%r'.__mod__
             class bytestr(bytes):
                 """A bytes which mostly acts as a Python 2 str

                 >>> bytestr(), bytestr(bytearray(b'foo')), bytestr(u'ascii'), bytestr(1)
                 ('', 'foo', 'ascii', '1')
                 >>> s = bytestr(b'foo')
                 >>> assert s is bytestr(s)

                 __bytes__() should be called if provided:

                 >>> class bytesable:
                 ...     def __bytes__(self):
                 ...         return b'bytes'
                 >>> bytestr(bytesable())
                 'bytes'

                 There's no implicit conversion from non-ascii str as its encoding is
                 unknown:

                 >>> bytestr(chr(0x80)) # doctest: +ELLIPSIS
                 Traceback (most recent call last):
                   ...
                 UnicodeEncodeError: ...

                 Comparison between bytestr and bytes should work:

                 >>> assert bytestr(b'foo') == b'foo'
                 >>> assert b'foo' == bytestr(b'foo')
                 >>> assert b'f' in bytestr(b'foo')
                 >>> assert bytestr(b'f') in b'foo'

                 Sliced elements should be bytes, not integer:

                 >>> s[1], s[:2]
                 (b'o', b'fo')
                 >>> list(s), list(reversed(s))
                 ([b'f', b'o', b'o'], [b'o', b'o', b'f'])

                 As bytestr type isn't propagated across operations, you need to cast
                 bytes to bytestr explicitly:

                 >>> s = bytestr(b'foo').upper()
                 >>> t = bytestr(s)
                 >>> s[0], t[0]
                 (70, b'F')

                 Be careful to not pass a bytestr object to a function which expects
                 bytearray-like behavior.

                 >>> t = bytes(t)  # cast to bytes
                 >>> assert type(t) is bytes
                 """

                 # Trick pytype into not demanding Iterable[int] be passed to __new__(),
                 # since the appropriate bytes format is done internally.
                 #
                 # https://github.com/google/pytype/issues/500
                 if TYPE_CHECKING:

                     def __init__(self, s=b''):
                         pass

                 def __new__(cls, s=b''):
                     # An existing bytestr is returned as-is rather than copied.
                     if isinstance(s, bytestr):
                         return s
                     # Anything that is neither bytes-like nor provides __bytes__()
                     # goes through str() and must then be pure ASCII; otherwise
                     # the encode() call raises UnicodeEncodeError.
                     if not isinstance(
                         s, (bytes, bytearray)
                     ) and not hasattr(  # hasattr-py3-only
                         s, u'__bytes__'
                     ):
                         s = str(s).encode('ascii')
                     return bytes.__new__(cls, s)

                 def __getitem__(self, key):
                     s = bytes.__getitem__(self, key)
                     # Indexing plain bytes with an integer yields an int; turn it
                     # back into a length-1 bytes. Slices are already bytes.
                     if not isinstance(s, bytes):
                         s = bytechr(s)
                     return s

                 def __iter__(self):
                     # Iterate as length-1 bytes objects instead of integers.
                     return iterbytestr(bytes.__iter__(self))

                 def __repr__(self):
                     return bytes.__repr__(self)[1:]  # drop the leading "b" prefix
             def iterbytestr(s):
                 """Lazily walk ``s``, turning each item into a length-1 bytes

                 This mirrors how iterating a Python 2 str object behaved.
                 """
                 single_bytes = map(bytechr, s)
                 return single_bytes
             def maybebytestr(s):
                 """Wrap ``s`` in bytestr when it is bytes; return anything else as-is"""
                 return bytestr(s) if isinstance(s, bytes) else s
             def sysbytes(s):
                 """Turn an internal str (e.g. keyword, __doc__) back into bytes

                 bytes input is returned unchanged; any other input is encoded as
                 UTF-8. Only ASCII text survives a sysstr(sysbytes(s)) round trip.
                 """
                 if not isinstance(s, bytes):
                     s = s.encode('utf-8')
                 return s
             def sysstr(s):
                 """Produce a native str suitable for getattr(), str.encode() and alike

                 str input is returned unchanged. Anything else is decoded as
                 latin-1, which gives every byte value its own code point: decoding
                 never raises UnicodeDecodeError and distinct inputs stay distinct.
                 """
                 if not isinstance(s, builtins.str):
                     s = s.decode('latin-1')
                 return s
             def strurl(url):
                 """Decode a bytes url to str using ASCII; pass other values through"""
                 if not isinstance(url, bytes):
                     return url
                 return url.decode('ascii')
             def bytesurl(url):
                 """Encode a str url to bytes using ASCII; pass other values through"""
                 if not isinstance(url, str):
                     return url
                 return url.encode('ascii')
             def raisewithtb(exc, tb):
                 """Attach traceback ``tb`` to ``exc`` and raise it"""
                 prepared = exc.with_traceback(tb)
                 raise prepared
             def getdoc(obj):
                 """Fetch the docstring of ``obj`` as bytes

                 A missing docstring yields None rather than b'', so that gettext()
                 won't confuse it with _('').
                 """
                 doc = getattr(obj, '__doc__', None)
                 return doc if doc is None else sysbytes(doc)
             def _wrapattrfunc(f):
                 """Wrap an attribute builtin so its name argument goes through sysstr()

                 The returned function has the signature ``(object, name, *args)`` and
                 carries the metadata of ``f``.
                 """

                 def w(object, name, *args):
                     native_name = sysstr(name)
                     return f(object, native_name, *args)

                 return functools.wraps(f)(w)
             # these wrappers are automagically imported by hgloader
             #
             # Each one shadows the builtin of the same name inside this module and
             # passes the attribute name through sysstr() before delegating.
             delattr = _wrapattrfunc(builtins.delattr)
             getattr = _wrapattrfunc(builtins.getattr)
             hasattr = _wrapattrfunc(builtins.hasattr)
             setattr = _wrapattrfunc(builtins.setattr)
             # Plain aliases of existing Python 3 builtins.
             xrange = builtins.range
             unicode = str
             def open(name, mode=b'r', buffering=-1, encoding=None):
                 """Call builtins.open() after converting ``mode`` with sysstr()

                 The remaining arguments are forwarded positionally, unchanged.
                 """
                 native_mode = sysstr(mode)
                 return builtins.open(name, native_mode, buffering, encoding)
             # Same wrapping as the module-level hasattr, under a second name.
             safehasattr = _wrapattrfunc(builtins.hasattr)
             def _getoptbwrapper(orig, args, shortlist, namelist):
                 """
                 Run the getopt-style parser ``orig`` on bytes input.

                 getopt does not accept bytes on Python 3, so every argument is decoded
                 as latin-1 before the call. The parsed options and the leftover
                 arguments are encoded back to bytes before being returned as an
                 ``(opts, args)`` pair.
                 """

                 def tostr(value):
                     return value.decode('latin-1')

                 def tobytes(value):
                     return value.encode('latin-1')

                 parsed, leftover = orig(
                     [tostr(arg) for arg in args],
                     tostr(shortlist),
                     [tostr(name) for name in namelist],
                 )
                 opts = [(tobytes(opt[0]), tobytes(opt[1])) for opt in parsed]
                 return opts, [tobytes(arg) for arg in leftover]
             def strkwargs(dic):
                 """
                 Return a copy of ``dic`` whose bytes keys are decoded to str.

                 Dictionaries with bytes keys can't be expanded as keyword arguments on
                 Python 3, so the keys are decoded as latin-1. Values are left untouched.
                 """
                 converted = {}
                 for key, value in dic.items():
                     converted[key.decode('latin-1')] = value
                 return converted
             def byteskwargs(dic):
                 """
                 Return a copy of ``dic`` whose str keys are encoded to bytes.

                 This undoes the str conversion that was needed to pass the dictionary
                 as keyword arguments on Python 3. Keys are encoded as latin-1; values
                 are left untouched.
                 """
                 converted = {}
                 for key, value in dic.items():
                     converted[key.encode('latin-1')] = value
                 return converted
             # TODO: handle shlex.shlex().
             def shlexsplit(s, comments=False, posix=True):
                 """
                 Split the bytes string ``s`` with shlex.split() and return bytes tokens.

                 shlex.split() doesn't accept bytes on Python 3, so the input is decoded
                 as latin-1 first and every resulting token is encoded back the same way.
                 """
                 text = s.decode('latin-1')
                 tokens = shlex.split(text, comments, posix)
                 return [token.encode('latin-1') for token in tokens]
             def iteritems(x):
                 """Return ``x.items()``

                 Defined with ``def`` rather than a lambda bound to a name, so the
                 function reports its real name in tracebacks and introspection.
                 """
                 return x.items()

             def itervalues(x):
                 """Return ``x.values()``

                 Defined with ``def`` rather than a lambda bound to a name, so the
                 function reports its real name in tracebacks and introspection.
                 """
                 return x.values()
             # Python 3.5's json.load and json.loads require str. We polyfill its
             # code for detecting encoding from bytes.
             if sys.version_info[0:2] < (3, 6):
                 def _detect_encoding(b):
                     # Guess the codec name for the bytes ``b``: byte-order marks are
                     # checked first, then the position of NUL bytes in the leading
                     # bytes; utf-8 is the fallback.
                     bstartswith = b.startswith
                     # The UTF-32 marks are tested before the UTF-16 ones.
                     if bstartswith((codecs.BOM_UTF32_BE, codecs.BOM_UTF32_LE)):
                         return 'utf-32'
                     if bstartswith((codecs.BOM_UTF16_BE, codecs.BOM_UTF16_LE)):
                         return 'utf-16'
                     if bstartswith(codecs.BOM_UTF8):
                         return 'utf-8-sig'
                     if len(b) >= 4:
                         if not b[0]:
                             # 00 00 -- -- - utf-32-be
                             # 00 XX -- -- - utf-16-be
                             return 'utf-16-be' if b[1] else 'utf-32-be'
                         if not b[1]:
                             # XX 00 00 00 - utf-32-le
                             # XX 00 00 XX - utf-16-le
                             # XX 00 XX -- - utf-16-le
                             return 'utf-16-le' if b[2] or b[3] else 'utf-32-le'
                     elif len(b) == 2:
                         if not b[0]:
                             # 00 XX - utf-16-be
                             return 'utf-16-be'
                         if not b[1]:
                             # XX 00 - utf-16-le
                             return 'utf-16-le'
                     # default
                     return 'utf-8'
                 def json_loads(s, *args, **kwargs):
                     # bytes/bytearray input is decoded with the detected codec before
                     # json.loads() sees it; other input is passed through untouched.
                     if isinstance(s, (bytes, bytearray)):
                         s = s.decode(_detect_encoding(s), 'surrogatepass')
                     return json.loads(s, *args, **kwargs)
             else:
                 # From 3.6 on, the stdlib function is used directly.
                 json_loads = json.loads
             # Platform flags derived from the bytes copies of sys.platform and os.name.
             isjython = sysplatform.startswith(b'java')
             isdarwin = sysplatform.startswith(b'darwin')
             islinux = sysplatform.startswith(b'linux')
             isposix = osname == b'posix'
             iswindows = osname == b'nt'
             def getoptb(args, shortlist, namelist):
                 """Run getopt.getopt() through _getoptbwrapper() and return its result"""
                 parser = getopt.getopt
                 return _getoptbwrapper(parser, args, shortlist, namelist)
             def gnugetoptb(args, shortlist, namelist):
                 """Run getopt.gnu_getopt() through _getoptbwrapper() and return its result"""
                 parser = getopt.gnu_getopt
                 return _getoptbwrapper(parser, args, shortlist, namelist)
             def mkdtemp(suffix=b'', prefix=b'tmp', dir=None):
                 """Call tempfile.mkdtemp() with bytes defaults for suffix and prefix"""
                 return tempfile.mkdtemp(suffix=suffix, prefix=prefix, dir=dir)
             # text=True is not supported; use util.from/tonativeeol() instead
             def mkstemp(suffix=b'', prefix=b'tmp', dir=None):
                 """Call tempfile.mkstemp() with bytes defaults for suffix and prefix"""
                 return tempfile.mkstemp(suffix=suffix, prefix=prefix, dir=dir)
             # TemporaryFile does not support an "encoding=" argument on python2.
             # Files created by this wrapper are always opened in byte mode.
             def unnamedtempfile(mode=None, *args, **kwargs):
                 """Call tempfile.TemporaryFile() with a binary mode

                 ``mode`` defaults to 'w+b'; a given mode is converted with sysstr().
                 Extra arguments are forwarded unchanged.
                 """
                 mode = 'w+b' if mode is None else sysstr(mode)
                 assert 'b' in mode
                 return tempfile.TemporaryFile(mode, *args, **kwargs)
             # NamedTemporaryFile does not support an "encoding=" argument on python2.
             # Files created by this wrapper are always opened in byte mode.
             def namedtempfile(
                 mode=b'w+b', bufsize=-1, suffix=b'', prefix=b'tmp', dir=None, delete=True
             ):
                 """Call tempfile.NamedTemporaryFile() with a binary mode

                 ``mode`` is converted with sysstr() and must contain 'b'. ``bufsize``
                 is forwarded positionally, the remaining options by keyword.
                 """
                 native_mode = sysstr(mode)
                 assert 'b' in native_mode
                 options = {
                     'suffix': suffix,
                     'prefix': prefix,
                     'dir': dir,
                     'delete': delete,
                 }
                 return tempfile.NamedTemporaryFile(native_mode, bufsize, **options)