pycompat.py
449 lines
| 13.6 KiB
| text/x-python
|
PythonLexer
/ mercurial / pycompat.py
timeless
|
r28818 | # pycompat.py - portability shim for python 3 | ||
# | ||||
# This software may be used and distributed according to the terms of the | ||||
# GNU General Public License version 2 or any later version. | ||||
"""Mercurial portability shim for python 3. | ||||
This contains aliases to hide python version-specific details from the core. | ||||
""" | ||||
from __future__ import absolute_import | ||||
Pulkit Goyal
|
r30578 | import getopt | ||
Augie Fackler
|
r36196 | import inspect | ||
Pulkit Goyal
|
r30302 | import os | ||
Pulkit Goyal
|
r30678 | import shlex | ||
Pulkit Goyal
|
r29584 | import sys | ||
Yuya Nishihara
|
r38182 | import tempfile | ||
Pulkit Goyal
|
r29584 | |||
Yuya Nishihara
|
r30030 | ispy3 = (sys.version_info[0] >= 3) | ||
Yuya Nishihara
|
r33628 | ispypy = (r'__pypy__' in sys.builtin_module_names) | ||
Yuya Nishihara
|
r30030 | |||
if not ispy3: | ||||
Gregory Szorc
|
r31934 | import cookielib | ||
Pulkit Goyal
|
r29324 | import cPickle as pickle | ||
Pulkit Goyal
|
r29455 | import httplib | ||
Gregory Szorc
|
r37863 | import Queue as queue | ||
Pulkit Goyal
|
r29433 | import SocketServer as socketserver | ||
Pulkit Goyal
|
r29432 | import xmlrpclib | ||
Gregory Szorc
|
r37646 | |||
from .thirdparty.concurrent import futures | ||||
Augie Fackler
|
r37687 | |||
def future_set_exception_info(f, exc_info): | ||||
f.set_exception_info(*exc_info) | ||||
Pulkit Goyal
|
r29584 | else: | ||
Gregory Szorc
|
r37646 | import concurrent.futures as futures | ||
Gregory Szorc
|
r31942 | import http.cookiejar as cookielib | ||
Pulkit Goyal
|
r29584 | import http.client as httplib | ||
import pickle | ||||
Gregory Szorc
|
r37863 | import queue as queue | ||
Pulkit Goyal
|
r29584 | import socketserver | ||
Pulkit Goyal
|
r29432 | import xmlrpc.client as xmlrpclib | ||
Pulkit Goyal
|
r29431 | |||
Augie Fackler
|
r37687 | def future_set_exception_info(f, exc_info): | ||
f.set_exception(exc_info[0]) | ||||
Yuya Nishihara
|
r31774 | def identity(a): | ||
return a | ||||
Yuya Nishihara
|
r38594 | def _rapply(f, xs): | ||
if xs is None: | ||||
# assume None means non-value of optional data | ||||
return xs | ||||
if isinstance(xs, (list, set, tuple)): | ||||
return type(xs)(_rapply(f, x) for x in xs) | ||||
if isinstance(xs, dict): | ||||
return type(xs)((_rapply(f, k), _rapply(f, v)) for k, v in xs.items()) | ||||
return f(xs) | ||||
def rapply(f, xs): | ||||
"""Apply function recursively to every item preserving the data structure | ||||
>>> def f(x): | ||||
... return 'f(%s)' % x | ||||
>>> rapply(f, None) is None | ||||
True | ||||
>>> rapply(f, 'a') | ||||
'f(a)' | ||||
>>> rapply(f, {'a'}) == {'f(a)'} | ||||
True | ||||
>>> rapply(f, ['a', 'b', None, {'c': 'd'}, []]) | ||||
['f(a)', 'f(b)', None, {'f(c)': 'f(d)'}, []] | ||||
>>> xs = [object()] | ||||
>>> rapply(identity, xs) is xs | ||||
True | ||||
""" | ||||
if f is identity: | ||||
# fast path mainly for py2 | ||||
return xs | ||||
return _rapply(f, xs) | ||||
Yuya Nishihara
|
r30030 | if ispy3: | ||
Yuya Nishihara
|
r29797 | import builtins | ||
Yuya Nishihara
|
r29799 | import functools | ||
Yuya Nishihara
|
r31372 | import io | ||
Martin von Zweigbergk
|
r31424 | import struct | ||
Yuya Nishihara
|
r31372 | |||
Martijn Pieters
|
r30119 | fsencode = os.fsencode | ||
Pulkit Goyal
|
r30300 | fsdecode = os.fsdecode | ||
Yuya Nishihara
|
r36666 | oscurdir = os.curdir.encode('ascii') | ||
Yuya Nishihara
|
r31775 | oslinesep = os.linesep.encode('ascii') | ||
Pulkit Goyal
|
r30302 | osname = os.name.encode('ascii') | ||
Pulkit Goyal
|
r30303 | ospathsep = os.pathsep.encode('ascii') | ||
Yuya Nishihara
|
r36665 | ospardir = os.pardir.encode('ascii') | ||
Pulkit Goyal
|
r30303 | ossep = os.sep.encode('ascii') | ||
Pulkit Goyal
|
r30623 | osaltsep = os.altsep | ||
if osaltsep: | ||||
osaltsep = osaltsep.encode('ascii') | ||||
Pulkit Goyal
|
r30500 | # os.getcwd() on Python 3 returns string, but it has os.getcwdb() which | ||
# returns bytes. | ||||
getcwd = os.getcwdb | ||||
Pulkit Goyal
|
r30624 | sysplatform = sys.platform.encode('ascii') | ||
Pulkit Goyal
|
r30668 | sysexecutable = sys.executable | ||
if sysexecutable: | ||||
sysexecutable = os.fsencode(sysexecutable) | ||||
Gregory Szorc
|
r36976 | bytesio = io.BytesIO | ||
# TODO deprecate stringio name, as it is a lie on Python 3. | ||||
stringio = bytesio | ||||
Yuya Nishihara
|
r36952 | |||
def maplist(*args): | ||||
return list(map(*args)) | ||||
Yuya Nishihara
|
r37082 | def rangelist(*args): | ||
return list(range(*args)) | ||||
Yuya Nishihara
|
r36952 | def ziplist(*args): | ||
return list(zip(*args)) | ||||
Yuya Nishihara
|
r33853 | rawinput = input | ||
Augie Fackler
|
r36196 | getargspec = inspect.getfullargspec | ||
Yuya Nishihara
|
r30334 | |||
Yuya Nishihara
|
r30472 | # TODO: .buffer might not exist if std streams were replaced; we'll need | ||
# a silly wrapper to make a bytes stream backed by a unicode one. | ||||
stdin = sys.stdin.buffer | ||||
stdout = sys.stdout.buffer | ||||
stderr = sys.stderr.buffer | ||||
Yuya Nishihara
|
r30334 | # Since Python 3 converts argv to wchar_t type by Py_DecodeLocale() on Unix, | ||
# we can use os.fsencode() to get back bytes argv. | ||||
# | ||||
# https://hg.python.org/cpython/file/v3.5.1/Programs/python.c#l55 | ||||
# | ||||
# TODO: On Windows, the native argv is wchar_t, so we'll need a different | ||||
# workaround to simulate the Python 2 (i.e. ANSI Win32 API) behavior. | ||||
Augie Fackler
|
r31277 | if getattr(sys, 'argv', None) is not None: | ||
sysargv = list(map(os.fsencode, sys.argv)) | ||||
Yuya Nishihara
|
r29797 | |||
Martin von Zweigbergk
|
r31424 | bytechr = struct.Struct('>B').pack | ||
Yuya Nishihara
|
r36279 | byterepr = b'%r'.__mod__ | ||
Yuya Nishihara
|
r31253 | |||
Yuya Nishihara
|
r31439 | class bytestr(bytes): | ||
"""A bytes which mostly acts as a Python 2 str | ||||
>>> bytestr(), bytestr(bytearray(b'foo')), bytestr(u'ascii'), bytestr(1) | ||||
Yuya Nishihara
|
r35921 | ('', 'foo', 'ascii', '1') | ||
Yuya Nishihara
|
r31439 | >>> s = bytestr(b'foo') | ||
>>> assert s is bytestr(s) | ||||
Yuya Nishihara
|
r32450 | __bytes__() should be called if provided: | ||
>>> class bytesable(object): | ||||
... def __bytes__(self): | ||||
... return b'bytes' | ||||
>>> bytestr(bytesable()) | ||||
Yuya Nishihara
|
r35921 | 'bytes' | ||
Yuya Nishihara
|
r32450 | |||
Yuya Nishihara
|
r31439 | There's no implicit conversion from non-ascii str as its encoding is | ||
unknown: | ||||
>>> bytestr(chr(0x80)) # doctest: +ELLIPSIS | ||||
Traceback (most recent call last): | ||||
... | ||||
UnicodeEncodeError: ... | ||||
Comparison between bytestr and bytes should work: | ||||
>>> assert bytestr(b'foo') == b'foo' | ||||
>>> assert b'foo' == bytestr(b'foo') | ||||
>>> assert b'f' in bytestr(b'foo') | ||||
>>> assert bytestr(b'f') in b'foo' | ||||
Sliced elements should be bytes, not integer: | ||||
>>> s[1], s[:2] | ||||
(b'o', b'fo') | ||||
>>> list(s), list(reversed(s)) | ||||
([b'f', b'o', b'o'], [b'o', b'o', b'f']) | ||||
As bytestr type isn't propagated across operations, you need to cast | ||||
bytes to bytestr explicitly: | ||||
>>> s = bytestr(b'foo').upper() | ||||
>>> t = bytestr(s) | ||||
>>> s[0], t[0] | ||||
(70, b'F') | ||||
Be careful to not pass a bytestr object to a function which expects | ||||
bytearray-like behavior. | ||||
>>> t = bytes(t) # cast to bytes | ||||
>>> assert type(t) is bytes | ||||
""" | ||||
def __new__(cls, s=b''): | ||||
if isinstance(s, bytestr): | ||||
return s | ||||
Yuya Nishihara
|
r32450 | if (not isinstance(s, (bytes, bytearray)) | ||
and not hasattr(s, u'__bytes__')): # hasattr-py3-only | ||||
Yuya Nishihara
|
r31439 | s = str(s).encode(u'ascii') | ||
return bytes.__new__(cls, s) | ||||
def __getitem__(self, key): | ||||
s = bytes.__getitem__(self, key) | ||||
if not isinstance(s, bytes): | ||||
s = bytechr(s) | ||||
return s | ||||
def __iter__(self): | ||||
return iterbytestr(bytes.__iter__(self)) | ||||
Yuya Nishihara
|
r35921 | def __repr__(self): | ||
return bytes.__repr__(self)[1:] # drop b'' | ||||
Yuya Nishihara
|
r31382 | def iterbytestr(s): | ||
"""Iterate bytes as if it were a str object of Python 2""" | ||||
Martin von Zweigbergk
|
r31425 | return map(bytechr, s) | ||
Yuya Nishihara
|
r31382 | |||
Yuya Nishihara
|
r35922 | def maybebytestr(s): | ||
"""Promote bytes to bytestr""" | ||||
if isinstance(s, bytes): | ||||
return bytestr(s) | ||||
return s | ||||
Yuya Nishihara
|
r31820 | def sysbytes(s): | ||
"""Convert an internal str (e.g. keyword, __doc__) back to bytes | ||||
This never raises UnicodeEncodeError, but only ASCII characters | ||||
can be round-trip by sysstr(sysbytes(s)). | ||||
""" | ||||
return s.encode(u'utf-8') | ||||
Yuya Nishihara
|
r30032 | def sysstr(s): | ||
"""Return a keyword str to be passed to Python functions such as | ||||
getattr() and str.encode() | ||||
This never raises UnicodeDecodeError. Non-ascii characters are | ||||
considered invalid and mapped to arbitrary but unique code points | ||||
such that 'sysstr(a) != sysstr(b)' for all 'a != b'. | ||||
""" | ||||
if isinstance(s, builtins.str): | ||||
return s | ||||
return s.decode(u'latin-1') | ||||
Pulkit Goyal
|
r32859 | def strurl(url): | ||
"""Converts a bytes url back to str""" | ||||
Pulkit Goyal
|
r36662 | if isinstance(url, bytes): | ||
return url.decode(u'ascii') | ||||
return url | ||||
Pulkit Goyal
|
r32859 | |||
Pulkit Goyal
|
r32860 | def bytesurl(url): | ||
"""Converts a str url to bytes by encoding in ascii""" | ||||
Pulkit Goyal
|
r36662 | if isinstance(url, str): | ||
return url.encode(u'ascii') | ||||
return url | ||||
Pulkit Goyal
|
r32860 | |||
Yuya Nishihara
|
r32186 | def raisewithtb(exc, tb): | ||
"""Raise exception with the given traceback""" | ||||
raise exc.with_traceback(tb) | ||||
Yuya Nishihara
|
r32615 | def getdoc(obj): | ||
"""Get docstring as bytes; may be None so gettext() won't confuse it | ||||
with _('')""" | ||||
doc = getattr(obj, u'__doc__', None) | ||||
if doc is None: | ||||
return doc | ||||
return sysbytes(doc) | ||||
Yuya Nishihara
|
r29799 | def _wrapattrfunc(f): | ||
@functools.wraps(f) | ||||
def w(object, name, *args): | ||||
Yuya Nishihara
|
r30032 | return f(object, sysstr(name), *args) | ||
Yuya Nishihara
|
r29799 | return w | ||
Yuya Nishihara
|
r29800 | # these wrappers are automagically imported by hgloader | ||
Yuya Nishihara
|
r29799 | delattr = _wrapattrfunc(builtins.delattr) | ||
getattr = _wrapattrfunc(builtins.getattr) | ||||
hasattr = _wrapattrfunc(builtins.hasattr) | ||||
setattr = _wrapattrfunc(builtins.setattr) | ||||
Yuya Nishihara
|
r29800 | xrange = builtins.range | ||
Joerg Sonnenberger
|
r39234 | membershiprange = builtins.range | ||
Pulkit Goyal
|
r31843 | unicode = str | ||
Yuya Nishihara
|
r29799 | |||
Augie Fackler
|
r36574 | def open(name, mode='r', buffering=-1, encoding=None): | ||
return builtins.open(name, sysstr(mode), buffering, encoding) | ||||
Pulkit Goyal
|
r31149 | |||
Yuya Nishihara
|
r37117 | safehasattr = _wrapattrfunc(builtins.hasattr) | ||
Yuya Nishihara
|
r35226 | def _getoptbwrapper(orig, args, shortlist, namelist): | ||
Pulkit Goyal
|
r32864 | """ | ||
Takes bytes arguments, converts them to unicode, pass them to | ||||
getopt.getopt(), convert the returned values back to bytes and then | ||||
return them for Python 3 compatibility as getopt.getopt() don't accepts | ||||
bytes on Python 3. | ||||
""" | ||||
Pulkit Goyal
|
r30578 | args = [a.decode('latin-1') for a in args] | ||
shortlist = shortlist.decode('latin-1') | ||||
namelist = [a.decode('latin-1') for a in namelist] | ||||
Yuya Nishihara
|
r35226 | opts, args = orig(args, shortlist, namelist) | ||
Pulkit Goyal
|
r30578 | opts = [(a[0].encode('latin-1'), a[1].encode('latin-1')) | ||
for a in opts] | ||||
args = [a.encode('latin-1') for a in args] | ||||
return opts, args | ||||
Pulkit Goyal
|
r30579 | def strkwargs(dic): | ||
Pulkit Goyal
|
r32864 | """ | ||
Converts the keys of a python dictonary to str i.e. unicodes so that | ||||
they can be passed as keyword arguments as dictonaries with bytes keys | ||||
can't be passed as keyword arguments to functions on Python 3. | ||||
""" | ||||
Pulkit Goyal
|
r30579 | dic = dict((k.decode('latin-1'), v) for k, v in dic.iteritems()) | ||
return dic | ||||
def byteskwargs(dic): | ||||
Pulkit Goyal
|
r32864 | """ | ||
Converts keys of python dictonaries to bytes as they were converted to | ||||
str to pass that dictonary as a keyword argument on Python 3. | ||||
""" | ||||
Pulkit Goyal
|
r30579 | dic = dict((k.encode('latin-1'), v) for k, v in dic.iteritems()) | ||
return dic | ||||
Pulkit Goyal
|
r30678 | # TODO: handle shlex.shlex(). | ||
Matt Harbison
|
r36352 | def shlexsplit(s, comments=False, posix=True): | ||
Pulkit Goyal
|
r32864 | """ | ||
Takes bytes argument, convert it to str i.e. unicodes, pass that into | ||||
shlex.split(), convert the returned value to bytes and return that for | ||||
Python 3 compatibility as shelx.split() don't accept bytes on Python 3. | ||||
""" | ||||
Matt Harbison
|
r36352 | ret = shlex.split(s.decode('latin-1'), comments, posix) | ||
Pulkit Goyal
|
r30678 | return [a.encode('latin-1') for a in ret] | ||
Yuya Nishihara
|
r30032 | else: | ||
Yuya Nishihara
|
r31372 | import cStringIO | ||
Gregory Szorc
|
r38805 | xrange = xrange | ||
Pulkit Goyal
|
r38332 | unicode = unicode | ||
Yuya Nishihara
|
r31253 | bytechr = chr | ||
Yuya Nishihara
|
r36279 | byterepr = repr | ||
Yuya Nishihara
|
r31439 | bytestr = str | ||
Yuya Nishihara
|
r31382 | iterbytestr = iter | ||
Yuya Nishihara
|
r35922 | maybebytestr = identity | ||
Yuya Nishihara
|
r31820 | sysbytes = identity | ||
Yuya Nishihara
|
r31774 | sysstr = identity | ||
Pulkit Goyal
|
r32859 | strurl = identity | ||
Pulkit Goyal
|
r32860 | bytesurl = identity | ||
Yuya Nishihara
|
r30032 | |||
Joerg Sonnenberger
|
r39234 | class membershiprange(object): | ||
"Like xrange(a,b) but with constant-time membership test" | ||||
def __init__(self, a, b): | ||||
self._range = xrange(a, b) | ||||
def __getitem__(self, n): | ||||
return self._range[n] | ||||
def __hash__(self): | ||||
return hash(self._range) | ||||
def __iter__(self): | ||||
return iter(self._range) | ||||
def __len__(self): | ||||
return len(self._range) | ||||
def __reversed__(self): | ||||
return reversed(self._range) | ||||
def __contains__(self, n): | ||||
if not self._range: | ||||
return False | ||||
return n >= self._range[0] and n <= self._range[-1] | ||||
Yuya Nishihara
|
r32186 | # this can't be parsed on Python 3 | ||
exec('def raisewithtb(exc, tb):\n' | ||||
' raise exc, None, tb\n') | ||||
Martijn Pieters
|
r30133 | def fsencode(filename): | ||
Pulkit Goyal
|
r32864 | """ | ||
Partial backport from os.py in Python 3, which only accepts bytes. | ||||
In Python 2, our paths should only ever be bytes, a unicode path | ||||
indicates a bug. | ||||
""" | ||||
Martijn Pieters
|
r30133 | if isinstance(filename, str): | ||
return filename | ||||
Martijn Pieters
|
r30119 | else: | ||
Martijn Pieters
|
r30133 | raise TypeError( | ||
"expect str, not %s" % type(filename).__name__) | ||||
Martijn Pieters
|
r30119 | |||
Pulkit Goyal
|
r30300 | # In Python 2, fsdecode() has a very chance to receive bytes. So it's | ||
# better not to touch Python 2 part as it's already working fine. | ||||
Yuya Nishihara
|
r31774 | fsdecode = identity | ||
Pulkit Goyal
|
r30300 | |||
Yuya Nishihara
|
r32615 | def getdoc(obj): | ||
return getattr(obj, '__doc__', None) | ||||
Yuya Nishihara
|
r37117 | _notset = object() | ||
def safehasattr(thing, attr): | ||||
return getattr(thing, attr, _notset) is not _notset | ||||
Yuya Nishihara
|
r35226 | def _getoptbwrapper(orig, args, shortlist, namelist): | ||
return orig(args, shortlist, namelist) | ||||
Pulkit Goyal
|
r30578 | |||
Yuya Nishihara
|
r31774 | strkwargs = identity | ||
byteskwargs = identity | ||||
Pulkit Goyal
|
r30579 | |||
Yuya Nishihara
|
r36666 | oscurdir = os.curdir | ||
Yuya Nishihara
|
r31775 | oslinesep = os.linesep | ||
Pulkit Goyal
|
r30302 | osname = os.name | ||
Pulkit Goyal
|
r30303 | ospathsep = os.pathsep | ||
Yuya Nishihara
|
r36665 | ospardir = os.pardir | ||
Pulkit Goyal
|
r30303 | ossep = os.sep | ||
Pulkit Goyal
|
r30623 | osaltsep = os.altsep | ||
Yuya Nishihara
|
r30472 | stdin = sys.stdin | ||
stdout = sys.stdout | ||||
stderr = sys.stderr | ||||
Augie Fackler
|
r31277 | if getattr(sys, 'argv', None) is not None: | ||
sysargv = sys.argv | ||||
Pulkit Goyal
|
r30624 | sysplatform = sys.platform | ||
Pulkit Goyal
|
r30500 | getcwd = os.getcwd | ||
Pulkit Goyal
|
r30668 | sysexecutable = sys.executable | ||
Pulkit Goyal
|
r30678 | shlexsplit = shlex.split | ||
Gregory Szorc
|
r36976 | bytesio = cStringIO.StringIO | ||
stringio = bytesio | ||||
Augie Fackler
|
r31501 | maplist = map | ||
Yuya Nishihara
|
r37082 | rangelist = range | ||
Pulkit Goyal
|
r35406 | ziplist = zip | ||
Yuya Nishihara
|
r33853 | rawinput = raw_input | ||
Augie Fackler
|
r36196 | getargspec = inspect.getargspec | ||
Jun Wu
|
r34640 | |||
isjython = sysplatform.startswith('java') | ||||
Jun Wu
|
r34645 | |||
isdarwin = sysplatform == 'darwin' | ||||
isposix = osname == 'posix' | ||||
iswindows = osname == 'nt' | ||||
Yuya Nishihara
|
r35226 | |||
def getoptb(args, shortlist, namelist): | ||||
return _getoptbwrapper(getopt.getopt, args, shortlist, namelist) | ||||
def gnugetoptb(args, shortlist, namelist): | ||||
return _getoptbwrapper(getopt.gnu_getopt, args, shortlist, namelist) | ||||
Yuya Nishihara
|
r38182 | |||
Yuya Nishihara
|
r38183 | def mkdtemp(suffix=b'', prefix=b'tmp', dir=None): | ||
return tempfile.mkdtemp(suffix, prefix, dir) | ||||
Yuya Nishihara
|
r38182 | # text=True is not supported; use util.from/tonativeeol() instead | ||
def mkstemp(suffix=b'', prefix=b'tmp', dir=None): | ||||
return tempfile.mkstemp(suffix, prefix, dir) | ||||
Yuya Nishihara
|
r38184 | |||
# mode must include 'b'ytes as encoding= is not supported | ||||
def namedtempfile(mode=b'w+b', bufsize=-1, suffix=b'', prefix=b'tmp', dir=None, | ||||
delete=True): | ||||
mode = sysstr(mode) | ||||
assert r'b' in mode | ||||
return tempfile.NamedTemporaryFile(mode, bufsize, suffix=suffix, | ||||
prefix=prefix, dir=dir, delete=delete) | ||||