py3compat.py
332 lines
| 10.4 KiB
| text/x-python
|
PythonLexer
Thomas Kluyver
|
r4740 | # coding: utf-8 | ||
"""Compatibility tricks for Python 3. Mainly to do with unicode.""" | ||||
Thomas Kluyver
|
r4894 | import functools | ||
Thomas Kluyver
|
r13447 | import os | ||
Thomas Kluyver
|
r4730 | import sys | ||
Thomas Kluyver
|
r4890 | import re | ||
Min RK
|
r21121 | import shutil | ||
Thomas Kluyver
|
r4759 | import types | ||
Brandon Parsons
|
r6655 | |||
Brandon Parsons
|
r6716 | from .encoding import DEFAULT_ENCODING | ||
Thomas Kluyver
|
r4730 | |||
def no_code(x, encoding=None): | ||||
return x | ||||
def decode(s, encoding=None): | ||||
Brandon Parsons
|
r6716 | encoding = encoding or DEFAULT_ENCODING | ||
Thomas Kluyver
|
r4730 | return s.decode(encoding, "replace") | ||
def encode(u, encoding=None): | ||||
Brandon Parsons
|
r6716 | encoding = encoding or DEFAULT_ENCODING | ||
Thomas Kluyver
|
r4730 | return u.encode(encoding, "replace") | ||
Brandon Parsons
|
r6651 | |||
Thomas Kluyver
|
r4731 | def cast_unicode(s, encoding=None): | ||
if isinstance(s, bytes): | ||||
return decode(s, encoding) | ||||
return s | ||||
def cast_bytes(s, encoding=None): | ||||
if not isinstance(s, bytes): | ||||
return encode(s, encoding) | ||||
return s | ||||
Thomas Kluyver
|
r4730 | |||
Min RK
|
r19203 | def buffer_to_bytes(buf): | ||
"""Cast a buffer object to bytes""" | ||||
if not isinstance(buf, bytes): | ||||
buf = bytes(buf) | ||||
return buf | ||||
Thomas Kluyver
|
r4894 | def _modify_str_or_docstring(str_change_func): | ||
@functools.wraps(str_change_func) | ||||
def wrapper(func_or_str): | ||||
Thomas Kluyver
|
r13353 | if isinstance(func_or_str, string_types): | ||
Thomas Kluyver
|
r4894 | func = None | ||
doc = func_or_str | ||||
else: | ||||
func = func_or_str | ||||
doc = func.__doc__ | ||||
doc = str_change_func(doc) | ||||
if func: | ||||
func.__doc__ = doc | ||||
return func | ||||
return doc | ||||
return wrapper | ||||
MinRK
|
r10635 | def safe_unicode(e): | ||
"""unicode(e) with various fallbacks. Used for exceptions, which may not be | ||||
safe to call unicode() on. | ||||
""" | ||||
try: | ||||
Thomas Kluyver
|
r13353 | return unicode_type(e) | ||
MinRK
|
r10635 | except UnicodeError: | ||
pass | ||||
try: | ||||
rossant
|
r12327 | return str_to_unicode(str(e)) | ||
MinRK
|
r10635 | except UnicodeError: | ||
pass | ||||
try: | ||||
rossant
|
r12327 | return str_to_unicode(repr(e)) | ||
MinRK
|
r10635 | except UnicodeError: | ||
pass | ||||
return u'Unrecoverably corrupt evalue' | ||||
Min RK
|
r21121 | # shutil.which from Python 3.4 | ||
def _shutil_which(cmd, mode=os.F_OK | os.X_OK, path=None): | ||||
"""Given a command, mode, and a PATH string, return the path which | ||||
conforms to the given mode on the PATH, or None if there is no such | ||||
file. | ||||
`mode` defaults to os.F_OK | os.X_OK. `path` defaults to the result | ||||
of os.environ.get("PATH"), or can be overridden with a custom search | ||||
path. | ||||
This is a backport of shutil.which from Python 3.4 | ||||
""" | ||||
# Check that a given file can be accessed with the correct mode. | ||||
# Additionally check that `file` is not a directory, as on Windows | ||||
# directories pass the os.access check. | ||||
def _access_check(fn, mode): | ||||
return (os.path.exists(fn) and os.access(fn, mode) | ||||
and not os.path.isdir(fn)) | ||||
# If we're given a path with a directory part, look it up directly rather | ||||
# than referring to PATH directories. This includes checking relative to the | ||||
# current directory, e.g. ./script | ||||
if os.path.dirname(cmd): | ||||
if _access_check(cmd, mode): | ||||
return cmd | ||||
return None | ||||
if path is None: | ||||
path = os.environ.get("PATH", os.defpath) | ||||
if not path: | ||||
return None | ||||
path = path.split(os.pathsep) | ||||
if sys.platform == "win32": | ||||
# The current directory takes precedence on Windows. | ||||
if not os.curdir in path: | ||||
path.insert(0, os.curdir) | ||||
# PATHEXT is necessary to check on Windows. | ||||
pathext = os.environ.get("PATHEXT", "").split(os.pathsep) | ||||
# See if the given file matches any of the expected path extensions. | ||||
# This will allow us to short circuit when given "python.exe". | ||||
# If it does match, only test that one, otherwise we have to try | ||||
# others. | ||||
if any(cmd.lower().endswith(ext.lower()) for ext in pathext): | ||||
files = [cmd] | ||||
else: | ||||
files = [cmd + ext for ext in pathext] | ||||
else: | ||||
# On other platforms you don't have things like PATHEXT to tell you | ||||
# what file suffixes are executable, so just pass on cmd as-is. | ||||
files = [cmd] | ||||
seen = set() | ||||
for dir in path: | ||||
normdir = os.path.normcase(dir) | ||||
if not normdir in seen: | ||||
seen.add(normdir) | ||||
for thefile in files: | ||||
name = os.path.join(dir, thefile) | ||||
if _access_check(name, mode): | ||||
return name | ||||
return None | ||||
Thomas Kluyver
|
r4730 | if sys.version_info[0] >= 3: | ||
PY3 = True | ||||
MinRK
|
r14895 | # keep reference to builtin_mod because the kernel overrides that value | ||
# to forward requests to a frontend. | ||||
def input(prompt=''): | ||||
return builtin_mod.input(prompt) | ||||
Thomas Kluyver
|
r4730 | builtin_mod_name = "builtins" | ||
Thomas Kluyver
|
r13351 | import builtins as builtin_mod | ||
Thomas Kluyver
|
r4730 | |||
str_to_unicode = no_code | ||||
unicode_to_str = no_code | ||||
str_to_bytes = encode | ||||
bytes_to_str = decode | ||||
Thomas Kluyver
|
r4758 | cast_bytes_py2 = no_code | ||
Thomas Kluyver
|
r13893 | cast_unicode_py2 = no_code | ||
Min RK
|
r19203 | buffer_to_bytes_py2 = no_code | ||
Thomas Kluyver
|
r4730 | |||
Thomas Kluyver
|
r9197 | string_types = (str,) | ||
Thomas Kluyver
|
r13153 | unicode_type = str | ||
Thomas Kluyver
|
r9197 | |||
Min RK
|
r21121 | which = shutil.which | ||
Thomas Kluyver
|
r4740 | def isidentifier(s, dotted=False): | ||
if dotted: | ||||
return all(isidentifier(a) for a in s.split(".")) | ||||
return s.isidentifier() | ||||
Thomas Kluyver
|
r17299 | |||
Thomas Kluyver
|
r13356 | xrange = range | ||
Thomas Kluyver
|
r13373 | def iteritems(d): return iter(d.items()) | ||
def itervalues(d): return iter(d.values()) | ||||
Thomas Kluyver
|
r13447 | getcwd = os.getcwd | ||
Thomas Kluyver
|
r4759 | |||
MethodType = types.MethodType | ||||
Thomas Ballinger
|
r18526 | |||
def execfile(fname, glob, loc=None, compiler=None): | ||||
MinRK
|
r4780 | loc = loc if (loc is not None) else glob | ||
Bradley M. Froehle
|
r7803 | with open(fname, 'rb') as f: | ||
Thomas Ballinger
|
r18526 | compiler = compiler or compile | ||
exec(compiler(f.read(), fname, 'exec'), glob, loc) | ||||
Thomas Kluyver
|
r4890 | |||
# Refactor print statements in doctests. | ||||
_print_statement_re = re.compile(r"\bprint (?P<expr>.*)$", re.MULTILINE) | ||||
def _print_statement_sub(match): | ||||
expr = match.groups('expr') | ||||
return "print(%s)" % expr | ||||
Thomas Kluyver
|
r4894 | |||
@_modify_str_or_docstring | ||||
def doctest_refactor_print(doc): | ||||
Thomas Kluyver
|
r4890 | """Refactor 'print x' statements in a doctest to print(x) style. 2to3 | ||
unfortunately doesn't pick up on our doctests. | ||||
Can accept a string or a function, so it can be used as a decorator.""" | ||||
Thomas Kluyver
|
r4894 | return _print_statement_re.sub(_print_statement_sub, doc) | ||
# Abstract u'abc' syntax: | ||||
@_modify_str_or_docstring | ||||
def u_format(s): | ||||
""""{u}'abc'" --> "'abc'" (Python 3) | ||||
Thomas Kluyver
|
r4890 | |||
Thomas Kluyver
|
r4894 | Accepts a string or a function, so it can be used as a decorator.""" | ||
return s.format(u='') | ||||
MinRK
|
r16505 | |||
def get_closure(f): | ||||
"""Get a function's closure attribute""" | ||||
return f.__closure__ | ||||
Thomas Kluyver
|
r4740 | |||
Thomas Kluyver
|
r4730 | else: | ||
PY3 = False | ||||
MinRK
|
r14895 | # keep reference to builtin_mod because the kernel overrides that value | ||
# to forward requests to a frontend. | ||||
def input(prompt=''): | ||||
return builtin_mod.raw_input(prompt) | ||||
Thomas Kluyver
|
r4730 | builtin_mod_name = "__builtin__" | ||
Thomas Kluyver
|
r13351 | import __builtin__ as builtin_mod | ||
Thomas Kluyver
|
r4730 | |||
str_to_unicode = decode | ||||
unicode_to_str = encode | ||||
str_to_bytes = no_code | ||||
bytes_to_str = no_code | ||||
Thomas Kluyver
|
r4758 | cast_bytes_py2 = cast_bytes | ||
Thomas Kluyver
|
r13893 | cast_unicode_py2 = cast_unicode | ||
Min RK
|
r19203 | buffer_to_bytes_py2 = buffer_to_bytes | ||
Thomas Kluyver
|
r4740 | |||
Thomas Kluyver
|
r9197 | string_types = (str, unicode) | ||
Thomas Kluyver
|
r13153 | unicode_type = unicode | ||
Thomas Kluyver
|
r9197 | |||
Thomas Kluyver
|
r4740 | import re | ||
_name_re = re.compile(r"[a-zA-Z_][a-zA-Z0-9_]*$") | ||||
def isidentifier(s, dotted=False): | ||||
if dotted: | ||||
return all(isidentifier(a) for a in s.split(".")) | ||||
return bool(_name_re.match(s)) | ||||
Thomas Kluyver
|
r4743 | |||
Thomas Kluyver
|
r13356 | xrange = xrange | ||
Thomas Kluyver
|
r13373 | def iteritems(d): return d.iteritems() | ||
def itervalues(d): return d.itervalues() | ||||
Thomas Kluyver
|
r13447 | getcwd = os.getcwdu | ||
Thomas Kluyver
|
r13356 | |||
Thomas Kluyver
|
r4759 | def MethodType(func, instance): | ||
return types.MethodType(func, instance, type(instance)) | ||||
MinRK
|
r4780 | |||
Thomas Kluyver
|
r4890 | def doctest_refactor_print(func_or_str): | ||
return func_or_str | ||||
Thomas Kluyver
|
r4730 | |||
MinRK
|
r16505 | def get_closure(f): | ||
"""Get a function's closure attribute""" | ||||
return f.func_closure | ||||
Min RK
|
r21121 | |||
which = _shutil_which | ||||
Jörgen Stenarson
|
r5089 | |||
Thomas Kluyver
|
r4894 | # Abstract u'abc' syntax: | ||
@_modify_str_or_docstring | ||||
def u_format(s): | ||||
""""{u}'abc'" --> "u'abc'" (Python 2) | ||||
Accepts a string or a function, so it can be used as a decorator.""" | ||||
return s.format(u='u') | ||||
Jörgen Stenarson
|
r5089 | |||
Jörgen Stenarson
|
r5090 | if sys.platform == 'win32': | ||
Thomas Ballinger
|
r18526 | def execfile(fname, glob=None, loc=None, compiler=None): | ||
Jörgen Stenarson
|
r5090 | loc = loc if (loc is not None) else glob | ||
Matthias Bussonnier
|
r18037 | scripttext = builtin_mod.open(fname).read()+ '\n' | ||
Thomas Kluyver
|
r5133 | # compile converts unicode filename to str assuming | ||
# ascii. Let's do the conversion before calling compile | ||||
Jörgen Stenarson
|
r5090 | if isinstance(fname, unicode): | ||
filename = unicode_to_str(fname) | ||||
else: | ||||
filename = fname | ||||
Thomas Ballinger
|
r18526 | compiler = compiler or compile | ||
exec(compiler(scripttext, filename, 'exec'), glob, loc) | ||||
Jörgen Stenarson
|
r5090 | else: | ||
Thomas Ballinger
|
r18526 | def execfile(fname, glob=None, loc=None, compiler=None): | ||
Jörgen Stenarson
|
r5090 | if isinstance(fname, unicode): | ||
filename = fname.encode(sys.getfilesystemencoding()) | ||||
else: | ||||
filename = fname | ||||
Thomas Ballinger
|
r18526 | where = [ns for ns in [glob, loc] if ns is not None] | ||
if compiler is None: | ||||
builtin_mod.execfile(filename, *where) | ||||
else: | ||||
scripttext = builtin_mod.open(fname).read().rstrip() + '\n' | ||||
exec(compiler(scripttext, filename, 'exec'), glob, loc) | ||||
Thomas Kluyver
|
r13359 | |||
MinRK
|
r15146 | |||
Scott Sanderson
|
r21803 | PY2 = not PY3 | ||
MinRK
|
r15146 | def annotate(**kwargs): | ||
"""Python 3 compatible function annotation for Python 2.""" | ||||
if not kwargs: | ||||
raise ValueError('annotations must be provided as keyword arguments') | ||||
def dec(f): | ||||
if hasattr(f, '__annotations__'): | ||||
for k, v in kwargs.items(): | ||||
f.__annotations__[k] = v | ||||
else: | ||||
f.__annotations__ = kwargs | ||||
return f | ||||
return dec | ||||
Thomas Kluyver
|
r13359 | # Parts below taken from six: | ||
# Copyright (c) 2010-2013 Benjamin Peterson | ||||
# | ||||
# Permission is hereby granted, free of charge, to any person obtaining a copy | ||||
# of this software and associated documentation files (the "Software"), to deal | ||||
# in the Software without restriction, including without limitation the rights | ||||
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell | ||||
# copies of the Software, and to permit persons to whom the Software is | ||||
# furnished to do so, subject to the following conditions: | ||||
# | ||||
# The above copyright notice and this permission notice shall be included in all | ||||
# copies or substantial portions of the Software. | ||||
# | ||||
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR | ||||
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, | ||||
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE | ||||
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER | ||||
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, | ||||
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE | ||||
# SOFTWARE. | ||||
def with_metaclass(meta, *bases): | ||||
"""Create a base class with a metaclass.""" | ||||
Thomas Kluyver
|
r13584 | return meta("_NewBase", bases, {}) | ||