Show More
@@ -0,0 +1,65 b'' | |||
|
1 | # py3kcompat.py - compatibility definitions for running hg in py3k | |
|
2 | # | |
|
3 | # Copyright 2010 Renato Cunha <renatoc@gmail.com> | |
|
4 | # | |
|
5 | # This software may be used and distributed according to the terms of the | |
|
6 | # GNU General Public License version 2 or any later version. | |
|
7 | ||
|
8 | import os, builtins | |
|
9 | ||
|
10 | from numbers import Number | |
|
11 | ||
|
12 | def bytesformatter(format, args): | |
|
13 | '''Custom implementation of a formatter for bytestrings. | |
|
14 | ||
|
15 | This function currently relies on the string formatter to do the | |
|
16 | formatting and always returns bytes objects. | |
|
17 | ||
|
18 | >>> bytesformatter(20, 10) | |
|
19 | 0 | |
|
20 | >>> bytesformatter('unicode %s, %s!', ('string', 'foo')) | |
|
21 | b'unicode string, foo!' | |
|
22 | >>> bytesformatter(b'test %s', 'me') | |
|
23 | b'test me' | |
|
24 | >>> bytesformatter('test %s', 'me') | |
|
25 | b'test me' | |
|
26 | >>> bytesformatter(b'test %s', b'me') | |
|
27 | b'test me' | |
|
28 | >>> bytesformatter('test %s', b'me') | |
|
29 | b'test me' | |
|
30 | >>> bytesformatter('test %d: %s', (1, b'result')) | |
|
31 | b'test 1: result' | |
|
32 | ''' | |
|
33 | # The current implementation just converts from bytes to unicode, does | |
|
34 | # what's needed and then converts the results back to bytes. | |
|
35 | # Another alternative is to use the Python C API implementation. | |
|
36 | if isinstance(format, Number): | |
|
37 | # If the fixer erroneously passes a number remainder operation to | |
|
38 | # bytesformatter, we just return the result of that operation | |
|
39 | return format % args | |
|
40 | if isinstance(format, bytes): | |
|
41 | format = format.decode('utf-8', 'surrogateescape') | |
|
42 | if isinstance(args, bytes): | |
|
43 | args = args.decode('utf-8', 'surrogateescape') | |
|
44 | if isinstance(args, tuple): | |
|
45 | newargs = [] | |
|
46 | for arg in args: | |
|
47 | if isinstance(arg, bytes): | |
|
48 | arg = arg.decode('utf-8', 'surrogateescape') | |
|
49 | newargs.append(arg) | |
|
50 | args = tuple(newargs) | |
|
51 | ret = format % args | |
|
52 | return ret.encode('utf-8', 'surrogateescape') | |
|
53 | builtins.bytesformatter = bytesformatter | |
|
54 | ||
|
55 | # Create bytes equivalents for os.environ values | |
|
56 | for key in list(os.environ.keys()): | |
|
57 | # UTF-8 is fine for us | |
|
58 | bkey = key.encode('utf-8', 'surrogateescape') | |
|
59 | bvalue = os.environ[key].encode('utf-8', 'surrogateescape') | |
|
60 | os.environ[bkey] = bvalue | |
|
61 | ||
|
62 | if __name__ == '__main__': | |
|
63 | import doctest | |
|
64 | doctest.testmod() | |
|
65 |
@@ -1,96 +1,97 b'' | |||
|
1 | 1 | """Fixer that changes plain strings to bytes strings.""" |
|
2 | 2 | |
|
3 | 3 | import re |
|
4 | 4 | |
|
5 | 5 | from lib2to3 import fixer_base |
|
6 | 6 | from lib2to3.pgen2 import token |
|
7 | 7 | from lib2to3.fixer_util import Name |
|
8 | 8 | from lib2to3.pygram import python_symbols as syms |
|
9 | 9 | |
|
10 | 10 | _re = re.compile(r'[rR]?[\'\"]') |
|
11 | 11 | |
|
12 | 12 | # XXX: Implementing a blacklist in 2to3 turned out to be more troublesome than |
|
13 | 13 | # blacklisting some modules inside the fixers. So, this is what I came up with. |
|
14 | 14 | |
|
15 | 15 | blacklist = ['mercurial/demandimport.py', |
|
16 | 'mercurial/py3kcompat.py', # valid python 3 already | |
|
16 | 17 | 'mercurial/i18n.py', |
|
17 | 18 | ] |
|
18 | 19 | |
|
19 | 20 | def isdocstring(node): |
|
20 | 21 | def isclassorfunction(ancestor): |
|
21 | 22 | symbols = (syms.funcdef, syms.classdef) |
|
22 | 23 | # if the current node is a child of a function definition, a class |
|
23 | 24 | # definition or a file, then it is a docstring |
|
24 | 25 | if ancestor.type == syms.simple_stmt: |
|
25 | 26 | try: |
|
26 | 27 | while True: |
|
27 | 28 | if ancestor.type in symbols: |
|
28 | 29 | return True |
|
29 | 30 | ancestor = ancestor.parent |
|
30 | 31 | except AttributeError: |
|
31 | 32 | return False |
|
32 | 33 | return False |
|
33 | 34 | |
|
34 | 35 | def ismodule(ancestor): |
|
35 | 36 | # Our child is a docstring if we are a simple statement, and our |
|
36 | 37 | # ancestor is file_input. In other words, our child is a lone string in |
|
37 | 38 | # the source file. |
|
38 | 39 | try: |
|
39 | 40 | if (ancestor.type == syms.simple_stmt and |
|
40 | 41 | ancestor.parent.type == syms.file_input): |
|
41 | 42 | return True |
|
42 | 43 | except AttributeError: |
|
43 | 44 | return False |
|
44 | 45 | |
|
45 | 46 | def isdocassignment(ancestor): |
|
46 | 47 | # Assigning to __doc__, definitely a string |
|
47 | 48 | try: |
|
48 | 49 | while True: |
|
49 | 50 | if (ancestor.type == syms.expr_stmt and |
|
50 | 51 | Name('__doc__') in ancestor.children): |
|
51 | 52 | return True |
|
52 | 53 | ancestor = ancestor.parent |
|
53 | 54 | except AttributeError: |
|
54 | 55 | return False |
|
55 | 56 | |
|
56 | 57 | if ismodule(node.parent) or \ |
|
57 | 58 | isdocassignment(node.parent) or \ |
|
58 | 59 | isclassorfunction(node.parent): |
|
59 | 60 | return True |
|
60 | 61 | return False |
|
61 | 62 | |
|
62 | 63 | def shouldtransform(node): |
|
63 | 64 | specialnames = ['__main__'] |
|
64 | 65 | |
|
65 | 66 | if node.value in specialnames: |
|
66 | 67 | return False |
|
67 | 68 | |
|
68 | 69 | ggparent = node.parent.parent.parent |
|
69 | 70 | sggparent = str(ggparent) |
|
70 | 71 | |
|
71 | 72 | if 'getattr' in sggparent or \ |
|
72 | 73 | 'hasattr' in sggparent or \ |
|
73 | 74 | 'setattr' in sggparent or \ |
|
74 | 75 | 'encode' in sggparent or \ |
|
75 | 76 | 'decode' in sggparent: |
|
76 | 77 | return False |
|
77 | 78 | |
|
78 | 79 | return True |
|
79 | 80 | |
|
80 | 81 | class FixBytes(fixer_base.BaseFix): |
|
81 | 82 | |
|
82 | 83 | PATTERN = 'STRING' |
|
83 | 84 | |
|
84 | 85 | def transform(self, node, results): |
|
85 | 86 | if self.filename in blacklist: |
|
86 | 87 | return |
|
87 | 88 | if node.type == token.STRING: |
|
88 | 89 | if _re.match(node.value): |
|
89 | 90 | if isdocstring(node): |
|
90 | 91 | return |
|
91 | 92 | if not shouldtransform(node): |
|
92 | 93 | return |
|
93 | 94 | new = node.clone() |
|
94 | 95 | new.value = 'b' + new.value |
|
95 | 96 | return new |
|
96 | 97 |
General Comments 0
You need to be logged in to leave comments.
Login now