##// END OF EJS Templates
py3kcompat: added a "compatibility layer" for py3k...
Renato Cunha -
r11748:37a70a78 default
parent child Browse files
Show More
@@ -0,0 +1,65 b''
1 # py3kcompat.py - compatibility definitions for running hg in py3k
2 #
3 # Copyright 2010 Renato Cunha <renatoc@gmail.com>
4 #
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
7
8 import os, builtins
9
10 from numbers import Number
11
12 def bytesformatter(format, args):
13 '''Custom implementation of a formatter for bytestrings.
14
15 This function currently relias on the string formatter to do the
16 formatting and always returns bytes objects.
17
18 >>> bytesformatter(20, 10)
19 0
20 >>> bytesformatter('unicode %s, %s!', ('string', 'foo'))
21 b'unicode string, foo!'
22 >>> bytesformatter(b'test %s', 'me')
23 b'test me'
24 >>> bytesformatter('test %s', 'me')
25 b'test me'
26 >>> bytesformatter(b'test %s', b'me')
27 b'test me'
28 >>> bytesformatter('test %s', b'me')
29 b'test me'
30 >>> bytesformatter('test %d: %s', (1, b'result'))
31 b'test 1: result'
32 '''
33 # The current implementation just converts from bytes to unicode, do
34 # what's needed and then convert the results back to bytes.
35 # Another alternative is to use the Python C API implementation.
36 if isinstance(format, Number):
37 # If the fixer erroneously passes a number remainder operation to
38 # bytesformatter, we just return the correct operation
39 return format % args
40 if isinstance(format, bytes):
41 format = format.decode('utf-8', 'surrogateescape')
42 if isinstance(args, bytes):
43 args = args.decode('utf-8', 'surrogateescape')
44 if isinstance(args, tuple):
45 newargs = []
46 for arg in args:
47 if isinstance(arg, bytes):
48 arg = arg.decode('utf-8', 'surrogateescape')
49 newargs.append(arg)
50 args = tuple(newargs)
51 ret = format % args
52 return ret.encode('utf-8', 'surrogateescape')
53 builtins.bytesformatter = bytesformatter
54
55 # Create bytes equivalents for os.environ values
56 for key in list(os.environ.keys()):
57 # UTF-8 is fine for us
58 bkey = key.encode('utf-8', 'surrogateescape')
59 bvalue = os.environ[key].encode('utf-8', 'surrogateescape')
60 os.environ[bkey] = bvalue
61
62 if __name__ == '__main__':
63 import doctest
64 doctest.testmod()
65
@@ -1,96 +1,97 b''
1 1 """Fixer that changes plain strings to bytes strings."""
2 2
3 3 import re
4 4
5 5 from lib2to3 import fixer_base
6 6 from lib2to3.pgen2 import token
7 7 from lib2to3.fixer_util import Name
8 8 from lib2to3.pygram import python_symbols as syms
9 9
10 10 _re = re.compile(r'[rR]?[\'\"]')
11 11
12 12 # XXX: Implementing a blacklist in 2to3 turned out to be more troublesome than
13 13 # blacklisting some modules inside the fixers. So, this is what I came with.
14 14
15 15 blacklist = ['mercurial/demandimport.py',
16 'mercurial/py3kcompat.py', # valid python 3 already
16 17 'mercurial/i18n.py',
17 18 ]
18 19
19 20 def isdocstring(node):
20 21 def isclassorfunction(ancestor):
21 22 symbols = (syms.funcdef, syms.classdef)
22 23 # if the current node is a child of a function definition, a class
23 24 # definition or a file, then it is a docstring
24 25 if ancestor.type == syms.simple_stmt:
25 26 try:
26 27 while True:
27 28 if ancestor.type in symbols:
28 29 return True
29 30 ancestor = ancestor.parent
30 31 except AttributeError:
31 32 return False
32 33 return False
33 34
34 35 def ismodule(ancestor):
35 36 # Our child is a docstring if we are a simple statement, and our
36 37 # ancestor is file_input. In other words, our child is a lone string in
37 38 # the source file.
38 39 try:
39 40 if (ancestor.type == syms.simple_stmt and
40 41 ancestor.parent.type == syms.file_input):
41 42 return True
42 43 except AttributeError:
43 44 return False
44 45
45 46 def isdocassignment(ancestor):
46 47 # Assigning to __doc__, definitely a string
47 48 try:
48 49 while True:
49 50 if (ancestor.type == syms.expr_stmt and
50 51 Name('__doc__') in ancestor.children):
51 52 return True
52 53 ancestor = ancestor.parent
53 54 except AttributeError:
54 55 return False
55 56
56 57 if ismodule(node.parent) or \
57 58 isdocassignment(node.parent) or \
58 59 isclassorfunction(node.parent):
59 60 return True
60 61 return False
61 62
62 63 def shouldtransform(node):
63 64 specialnames = ['__main__']
64 65
65 66 if node.value in specialnames:
66 67 return False
67 68
68 69 ggparent = node.parent.parent.parent
69 70 sggparent = str(ggparent)
70 71
71 72 if 'getattr' in sggparent or \
72 73 'hasattr' in sggparent or \
73 74 'setattr' in sggparent or \
74 75 'encode' in sggparent or \
75 76 'decode' in sggparent:
76 77 return False
77 78
78 79 return True
79 80
80 81 class FixBytes(fixer_base.BaseFix):
81 82
82 83 PATTERN = 'STRING'
83 84
84 85 def transform(self, node, results):
85 86 if self.filename in blacklist:
86 87 return
87 88 if node.type == token.STRING:
88 89 if _re.match(node.value):
89 90 if isdocstring(node):
90 91 return
91 92 if not shouldtransform(node):
92 93 return
93 94 new = node.clone()
94 95 new.value = 'b' + new.value
95 96 return new
96 97
General Comments 0
You need to be logged in to leave comments. Login now