pycompat.py
380 lines
| 11.4 KiB
| text/x-python
|
PythonLexer
/ mercurial / pycompat.py
timeless
|
r28818 | # pycompat.py - portability shim for python 3 | ||
# | ||||
# This software may be used and distributed according to the terms of the | ||||
# GNU General Public License version 2 or any later version. | ||||
"""Mercurial portability shim for python 3. | ||||
This contains aliases to hide python version-specific details from the core. | ||||
""" | ||||
from __future__ import absolute_import | ||||
Pulkit Goyal
|
r30578 | import getopt | ||
Augie Fackler
|
r36196 | import inspect | ||
Pulkit Goyal
|
r30302 | import os | ||
Pulkit Goyal
|
r30678 | import shlex | ||
Pulkit Goyal
|
r29584 | import sys | ||
Yuya Nishihara
|
r30030 | ispy3 = (sys.version_info[0] >= 3) | ||
Yuya Nishihara
|
r33628 | ispypy = (r'__pypy__' in sys.builtin_module_names) | ||
Yuya Nishihara
|
r30030 | |||
if not ispy3: | ||||
Gregory Szorc
|
r31934 | import cookielib | ||
Pulkit Goyal
|
r29324 | import cPickle as pickle | ||
Pulkit Goyal
|
r29455 | import httplib | ||
Pulkit Goyal
|
r29584 | import Queue as _queue | ||
Pulkit Goyal
|
r29433 | import SocketServer as socketserver | ||
Pulkit Goyal
|
r29432 | import xmlrpclib | ||
Pulkit Goyal
|
r29584 | else: | ||
Gregory Szorc
|
r31942 | import http.cookiejar as cookielib | ||
Pulkit Goyal
|
r29584 | import http.client as httplib | ||
import pickle | ||||
import queue as _queue | ||||
import socketserver | ||||
Pulkit Goyal
|
r29432 | import xmlrpc.client as xmlrpclib | ||
Pulkit Goyal
|
r29431 | |||
Pulkit Goyal
|
r32865 | empty = _queue.Empty | ||
queue = _queue.Queue | ||||
Yuya Nishihara
|
r31774 | def identity(a): | ||
return a | ||||
Yuya Nishihara
|
r30030 | if ispy3: | ||
Yuya Nishihara
|
r29797 | import builtins | ||
Yuya Nishihara
|
r29799 | import functools | ||
Yuya Nishihara
|
r31372 | import io | ||
Martin von Zweigbergk
|
r31424 | import struct | ||
Yuya Nishihara
|
r31372 | |||
Martijn Pieters
|
r30119 | fsencode = os.fsencode | ||
Pulkit Goyal
|
r30300 | fsdecode = os.fsdecode | ||
Yuya Nishihara
|
r36666 | oscurdir = os.curdir.encode('ascii') | ||
Yuya Nishihara
|
r31775 | oslinesep = os.linesep.encode('ascii') | ||
Pulkit Goyal
|
r30302 | osname = os.name.encode('ascii') | ||
Pulkit Goyal
|
r30303 | ospathsep = os.pathsep.encode('ascii') | ||
Yuya Nishihara
|
r36665 | ospardir = os.pardir.encode('ascii') | ||
Pulkit Goyal
|
r30303 | ossep = os.sep.encode('ascii') | ||
Pulkit Goyal
|
r30623 | osaltsep = os.altsep | ||
if osaltsep: | ||||
osaltsep = osaltsep.encode('ascii') | ||||
Pulkit Goyal
|
r30500 | # os.getcwd() on Python 3 returns string, but it has os.getcwdb() which | ||
# returns bytes. | ||||
getcwd = os.getcwdb | ||||
Pulkit Goyal
|
r30624 | sysplatform = sys.platform.encode('ascii') | ||
Pulkit Goyal
|
r30668 | sysexecutable = sys.executable | ||
if sysexecutable: | ||||
sysexecutable = os.fsencode(sysexecutable) | ||||
Gregory Szorc
|
r36976 | bytesio = io.BytesIO | ||
# TODO deprecate stringio name, as it is a lie on Python 3. | ||||
stringio = bytesio | ||||
Yuya Nishihara
|
r36952 | |||
def maplist(*args): | ||||
return list(map(*args)) | ||||
Yuya Nishihara
|
r37082 | def rangelist(*args): | ||
return list(range(*args)) | ||||
Yuya Nishihara
|
r36952 | def ziplist(*args): | ||
return list(zip(*args)) | ||||
Yuya Nishihara
|
r33853 | rawinput = input | ||
Augie Fackler
|
r36196 | getargspec = inspect.getfullargspec | ||
Yuya Nishihara
|
r30334 | |||
Yuya Nishihara
|
r30472 | # TODO: .buffer might not exist if std streams were replaced; we'll need | ||
# a silly wrapper to make a bytes stream backed by a unicode one. | ||||
stdin = sys.stdin.buffer | ||||
stdout = sys.stdout.buffer | ||||
stderr = sys.stderr.buffer | ||||
Yuya Nishihara
|
r30334 | # Since Python 3 converts argv to wchar_t type by Py_DecodeLocale() on Unix, | ||
# we can use os.fsencode() to get back bytes argv. | ||||
# | ||||
# https://hg.python.org/cpython/file/v3.5.1/Programs/python.c#l55 | ||||
# | ||||
# TODO: On Windows, the native argv is wchar_t, so we'll need a different | ||||
# workaround to simulate the Python 2 (i.e. ANSI Win32 API) behavior. | ||||
Augie Fackler
|
r31277 | if getattr(sys, 'argv', None) is not None: | ||
sysargv = list(map(os.fsencode, sys.argv)) | ||||
Yuya Nishihara
|
r29797 | |||
Martin von Zweigbergk
|
r31424 | bytechr = struct.Struct('>B').pack | ||
Yuya Nishihara
|
r36279 | byterepr = b'%r'.__mod__ | ||
Yuya Nishihara
|
r31253 | |||
Yuya Nishihara
|
r31439 | class bytestr(bytes): | ||
"""A bytes which mostly acts as a Python 2 str | ||||
>>> bytestr(), bytestr(bytearray(b'foo')), bytestr(u'ascii'), bytestr(1) | ||||
Yuya Nishihara
|
r35921 | ('', 'foo', 'ascii', '1') | ||
Yuya Nishihara
|
r31439 | >>> s = bytestr(b'foo') | ||
>>> assert s is bytestr(s) | ||||
Yuya Nishihara
|
r32450 | __bytes__() should be called if provided: | ||
>>> class bytesable(object): | ||||
... def __bytes__(self): | ||||
... return b'bytes' | ||||
>>> bytestr(bytesable()) | ||||
Yuya Nishihara
|
r35921 | 'bytes' | ||
Yuya Nishihara
|
r32450 | |||
Yuya Nishihara
|
r31439 | There's no implicit conversion from non-ascii str as its encoding is | ||
unknown: | ||||
>>> bytestr(chr(0x80)) # doctest: +ELLIPSIS | ||||
Traceback (most recent call last): | ||||
... | ||||
UnicodeEncodeError: ... | ||||
Comparison between bytestr and bytes should work: | ||||
>>> assert bytestr(b'foo') == b'foo' | ||||
>>> assert b'foo' == bytestr(b'foo') | ||||
>>> assert b'f' in bytestr(b'foo') | ||||
>>> assert bytestr(b'f') in b'foo' | ||||
Sliced elements should be bytes, not integer: | ||||
>>> s[1], s[:2] | ||||
(b'o', b'fo') | ||||
>>> list(s), list(reversed(s)) | ||||
([b'f', b'o', b'o'], [b'o', b'o', b'f']) | ||||
As bytestr type isn't propagated across operations, you need to cast | ||||
bytes to bytestr explicitly: | ||||
>>> s = bytestr(b'foo').upper() | ||||
>>> t = bytestr(s) | ||||
>>> s[0], t[0] | ||||
(70, b'F') | ||||
Be careful to not pass a bytestr object to a function which expects | ||||
bytearray-like behavior. | ||||
>>> t = bytes(t) # cast to bytes | ||||
>>> assert type(t) is bytes | ||||
""" | ||||
def __new__(cls, s=b''): | ||||
if isinstance(s, bytestr): | ||||
return s | ||||
Yuya Nishihara
|
r32450 | if (not isinstance(s, (bytes, bytearray)) | ||
and not hasattr(s, u'__bytes__')): # hasattr-py3-only | ||||
Yuya Nishihara
|
r31439 | s = str(s).encode(u'ascii') | ||
return bytes.__new__(cls, s) | ||||
def __getitem__(self, key): | ||||
s = bytes.__getitem__(self, key) | ||||
if not isinstance(s, bytes): | ||||
s = bytechr(s) | ||||
return s | ||||
def __iter__(self): | ||||
return iterbytestr(bytes.__iter__(self)) | ||||
Yuya Nishihara
|
r35921 | def __repr__(self): | ||
return bytes.__repr__(self)[1:] # drop b'' | ||||
Yuya Nishihara
|
r31382 | def iterbytestr(s): | ||
"""Iterate bytes as if it were a str object of Python 2""" | ||||
Martin von Zweigbergk
|
r31425 | return map(bytechr, s) | ||
Yuya Nishihara
|
r31382 | |||
Yuya Nishihara
|
r35922 | def maybebytestr(s): | ||
"""Promote bytes to bytestr""" | ||||
if isinstance(s, bytes): | ||||
return bytestr(s) | ||||
return s | ||||
Yuya Nishihara
|
r31820 | def sysbytes(s): | ||
"""Convert an internal str (e.g. keyword, __doc__) back to bytes | ||||
This never raises UnicodeEncodeError, but only ASCII characters | ||||
can be round-trip by sysstr(sysbytes(s)). | ||||
""" | ||||
return s.encode(u'utf-8') | ||||
Yuya Nishihara
|
r30032 | def sysstr(s): | ||
"""Return a keyword str to be passed to Python functions such as | ||||
getattr() and str.encode() | ||||
This never raises UnicodeDecodeError. Non-ascii characters are | ||||
considered invalid and mapped to arbitrary but unique code points | ||||
such that 'sysstr(a) != sysstr(b)' for all 'a != b'. | ||||
""" | ||||
if isinstance(s, builtins.str): | ||||
return s | ||||
return s.decode(u'latin-1') | ||||
Pulkit Goyal
|
r32859 | def strurl(url): | ||
"""Converts a bytes url back to str""" | ||||
Pulkit Goyal
|
r36662 | if isinstance(url, bytes): | ||
return url.decode(u'ascii') | ||||
return url | ||||
Pulkit Goyal
|
r32859 | |||
Pulkit Goyal
|
r32860 | def bytesurl(url): | ||
"""Converts a str url to bytes by encoding in ascii""" | ||||
Pulkit Goyal
|
r36662 | if isinstance(url, str): | ||
return url.encode(u'ascii') | ||||
return url | ||||
Pulkit Goyal
|
r32860 | |||
Yuya Nishihara
|
r32186 | def raisewithtb(exc, tb): | ||
"""Raise exception with the given traceback""" | ||||
raise exc.with_traceback(tb) | ||||
Yuya Nishihara
|
r32615 | def getdoc(obj): | ||
"""Get docstring as bytes; may be None so gettext() won't confuse it | ||||
with _('')""" | ||||
doc = getattr(obj, u'__doc__', None) | ||||
if doc is None: | ||||
return doc | ||||
return sysbytes(doc) | ||||
Yuya Nishihara
|
r29799 | def _wrapattrfunc(f): | ||
@functools.wraps(f) | ||||
def w(object, name, *args): | ||||
Yuya Nishihara
|
r30032 | return f(object, sysstr(name), *args) | ||
Yuya Nishihara
|
r29799 | return w | ||
Yuya Nishihara
|
r29800 | # these wrappers are automagically imported by hgloader | ||
Yuya Nishihara
|
r29799 | delattr = _wrapattrfunc(builtins.delattr) | ||
getattr = _wrapattrfunc(builtins.getattr) | ||||
hasattr = _wrapattrfunc(builtins.hasattr) | ||||
setattr = _wrapattrfunc(builtins.setattr) | ||||
Yuya Nishihara
|
r29800 | xrange = builtins.range | ||
Pulkit Goyal
|
r31843 | unicode = str | ||
Yuya Nishihara
|
r29799 | |||
Augie Fackler
|
r36574 | def open(name, mode='r', buffering=-1, encoding=None): | ||
return builtins.open(name, sysstr(mode), buffering, encoding) | ||||
Pulkit Goyal
|
r31149 | |||
Yuya Nishihara
|
r37117 | safehasattr = _wrapattrfunc(builtins.hasattr) | ||
Yuya Nishihara
|
r35226 | def _getoptbwrapper(orig, args, shortlist, namelist): | ||
Pulkit Goyal
|
r32864 | """ | ||
Takes bytes arguments, converts them to unicode, pass them to | ||||
getopt.getopt(), convert the returned values back to bytes and then | ||||
return them for Python 3 compatibility as getopt.getopt() don't accepts | ||||
bytes on Python 3. | ||||
""" | ||||
Pulkit Goyal
|
r30578 | args = [a.decode('latin-1') for a in args] | ||
shortlist = shortlist.decode('latin-1') | ||||
namelist = [a.decode('latin-1') for a in namelist] | ||||
Yuya Nishihara
|
r35226 | opts, args = orig(args, shortlist, namelist) | ||
Pulkit Goyal
|
r30578 | opts = [(a[0].encode('latin-1'), a[1].encode('latin-1')) | ||
for a in opts] | ||||
args = [a.encode('latin-1') for a in args] | ||||
return opts, args | ||||
Pulkit Goyal
|
r30579 | def strkwargs(dic): | ||
Pulkit Goyal
|
r32864 | """ | ||
Converts the keys of a python dictonary to str i.e. unicodes so that | ||||
they can be passed as keyword arguments as dictonaries with bytes keys | ||||
can't be passed as keyword arguments to functions on Python 3. | ||||
""" | ||||
Pulkit Goyal
|
r30579 | dic = dict((k.decode('latin-1'), v) for k, v in dic.iteritems()) | ||
return dic | ||||
def byteskwargs(dic): | ||||
Pulkit Goyal
|
r32864 | """ | ||
Converts keys of python dictonaries to bytes as they were converted to | ||||
str to pass that dictonary as a keyword argument on Python 3. | ||||
""" | ||||
Pulkit Goyal
|
r30579 | dic = dict((k.encode('latin-1'), v) for k, v in dic.iteritems()) | ||
return dic | ||||
Pulkit Goyal
|
r30678 | # TODO: handle shlex.shlex(). | ||
Matt Harbison
|
r36352 | def shlexsplit(s, comments=False, posix=True): | ||
Pulkit Goyal
|
r32864 | """ | ||
Takes bytes argument, convert it to str i.e. unicodes, pass that into | ||||
shlex.split(), convert the returned value to bytes and return that for | ||||
Python 3 compatibility as shelx.split() don't accept bytes on Python 3. | ||||
""" | ||||
Matt Harbison
|
r36352 | ret = shlex.split(s.decode('latin-1'), comments, posix) | ||
Pulkit Goyal
|
r30678 | return [a.encode('latin-1') for a in ret] | ||
Gregory Szorc
|
r36062 | def emailparser(*args, **kwargs): | ||
import email.parser | ||||
return email.parser.BytesParser(*args, **kwargs) | ||||
Yuya Nishihara
|
r30032 | else: | ||
Yuya Nishihara
|
r31372 | import cStringIO | ||
Yuya Nishihara
|
r31253 | bytechr = chr | ||
Yuya Nishihara
|
r36279 | byterepr = repr | ||
Yuya Nishihara
|
r31439 | bytestr = str | ||
Yuya Nishihara
|
r31382 | iterbytestr = iter | ||
Yuya Nishihara
|
r35922 | maybebytestr = identity | ||
Yuya Nishihara
|
r31820 | sysbytes = identity | ||
Yuya Nishihara
|
r31774 | sysstr = identity | ||
Pulkit Goyal
|
r32859 | strurl = identity | ||
Pulkit Goyal
|
r32860 | bytesurl = identity | ||
Yuya Nishihara
|
r30032 | |||
Yuya Nishihara
|
r32186 | # this can't be parsed on Python 3 | ||
exec('def raisewithtb(exc, tb):\n' | ||||
' raise exc, None, tb\n') | ||||
Martijn Pieters
|
r30133 | def fsencode(filename): | ||
Pulkit Goyal
|
r32864 | """ | ||
Partial backport from os.py in Python 3, which only accepts bytes. | ||||
In Python 2, our paths should only ever be bytes, a unicode path | ||||
indicates a bug. | ||||
""" | ||||
Martijn Pieters
|
r30133 | if isinstance(filename, str): | ||
return filename | ||||
Martijn Pieters
|
r30119 | else: | ||
Martijn Pieters
|
r30133 | raise TypeError( | ||
"expect str, not %s" % type(filename).__name__) | ||||
Martijn Pieters
|
r30119 | |||
Pulkit Goyal
|
r30300 | # In Python 2, fsdecode() has a very chance to receive bytes. So it's | ||
# better not to touch Python 2 part as it's already working fine. | ||||
Yuya Nishihara
|
r31774 | fsdecode = identity | ||
Pulkit Goyal
|
r30300 | |||
Yuya Nishihara
|
r32615 | def getdoc(obj): | ||
return getattr(obj, '__doc__', None) | ||||
Yuya Nishihara
|
r37117 | _notset = object() | ||
def safehasattr(thing, attr): | ||||
return getattr(thing, attr, _notset) is not _notset | ||||
Yuya Nishihara
|
r35226 | def _getoptbwrapper(orig, args, shortlist, namelist): | ||
return orig(args, shortlist, namelist) | ||||
Pulkit Goyal
|
r30578 | |||
Yuya Nishihara
|
r31774 | strkwargs = identity | ||
byteskwargs = identity | ||||
Pulkit Goyal
|
r30579 | |||
Yuya Nishihara
|
r36666 | oscurdir = os.curdir | ||
Yuya Nishihara
|
r31775 | oslinesep = os.linesep | ||
Pulkit Goyal
|
r30302 | osname = os.name | ||
Pulkit Goyal
|
r30303 | ospathsep = os.pathsep | ||
Yuya Nishihara
|
r36665 | ospardir = os.pardir | ||
Pulkit Goyal
|
r30303 | ossep = os.sep | ||
Pulkit Goyal
|
r30623 | osaltsep = os.altsep | ||
Yuya Nishihara
|
r30472 | stdin = sys.stdin | ||
stdout = sys.stdout | ||||
stderr = sys.stderr | ||||
Augie Fackler
|
r31277 | if getattr(sys, 'argv', None) is not None: | ||
sysargv = sys.argv | ||||
Pulkit Goyal
|
r30624 | sysplatform = sys.platform | ||
Pulkit Goyal
|
r30500 | getcwd = os.getcwd | ||
Pulkit Goyal
|
r30668 | sysexecutable = sys.executable | ||
Pulkit Goyal
|
r30678 | shlexsplit = shlex.split | ||
Gregory Szorc
|
r36976 | bytesio = cStringIO.StringIO | ||
stringio = bytesio | ||||
Augie Fackler
|
r31501 | maplist = map | ||
Yuya Nishihara
|
r37082 | rangelist = range | ||
Pulkit Goyal
|
r35406 | ziplist = zip | ||
Yuya Nishihara
|
r33853 | rawinput = raw_input | ||
Augie Fackler
|
r36196 | getargspec = inspect.getargspec | ||
Jun Wu
|
r34640 | |||
Gregory Szorc
|
r36062 | def emailparser(*args, **kwargs): | ||
import email.parser | ||||
return email.parser.Parser(*args, **kwargs) | ||||
Jun Wu
|
r34640 | isjython = sysplatform.startswith('java') | ||
Jun Wu
|
r34645 | |||
isdarwin = sysplatform == 'darwin' | ||||
isposix = osname == 'posix' | ||||
iswindows = osname == 'nt' | ||||
Yuya Nishihara
|
r35226 | |||
def getoptb(args, shortlist, namelist): | ||||
return _getoptbwrapper(getopt.getopt, args, shortlist, namelist) | ||||
def gnugetoptb(args, shortlist, namelist): | ||||
return _getoptbwrapper(getopt.gnu_getopt, args, shortlist, namelist) | ||||