upstream/mercurial-mirror Commit - r11748:37a70a78

py3kcompat: added a "compatibility layer" for py3k...

Renato Cunha -

r11748:37a70a78 default

parent child

mercurial/py3kcompat.py

0 created 644 +65 0

			@@ -0,0 +1,65 b''
		1	# py3kcompat.py - compatibility definitions for running hg in py3k
		2	#
		3	# Copyright 2010 Renato Cunha <renatoc@gmail.com>
		4	#
		5	# This software may be used and distributed according to the terms of the
		6	# GNU General Public License version 2 or any later version.
		7
		8	import os, builtins
		9
		10	from numbers import Number
		11
		def bytesformatter(format, args):
		    '''Custom implementation of a formatter for bytestrings.

		    This function currently relies on the string formatter to do the
		    formatting and always returns bytes objects. The only exception is a
		    numeric ``format``, for which the plain remainder ``format % args``
		    is returned unchanged.

		    ``format`` may be bytes or str. ``args`` may be a single value, a
		    tuple of values or a dict (for ``%(name)s`` style formats). Any bytes
		    found in ``format``, in ``args`` itself, in the items of a tuple or in
		    the keys/values of a dict are decoded before formatting.

		    >>> bytesformatter(20, 10)
		    0
		    >>> bytesformatter('unicode %s, %s!', ('string', 'foo'))
		    b'unicode string, foo!'
		    >>> bytesformatter(b'test %s', 'me')
		    b'test me'
		    >>> bytesformatter('test %s', 'me')
		    b'test me'
		    >>> bytesformatter(b'test %s', b'me')
		    b'test me'
		    >>> bytesformatter('test %s', b'me')
		    b'test me'
		    >>> bytesformatter('test %d: %s', (1, b'result'))
		    b'test 1: result'
		    >>> bytesformatter(b'%(key)s', {b'key': b'value'})
		    b'value'
		    '''
		    # The current implementation just converts from bytes to unicode, does
		    # what's needed and then converts the result back to bytes.
		    # Another alternative is to use the Python C API implementation.
		    def _decode(value):
		        # surrogateescape keeps undecodable bytes round-trippable, so the
		        # final encode() restores them exactly.
		        if isinstance(value, bytes):
		            return value.decode('utf-8', 'surrogateescape')
		        return value

		    if isinstance(format, Number):
		        # If the fixer erroneously passes a number remainder operation to
		        # bytesformatter, we just return the correct operation
		        return format % args

		    format = _decode(format)
		    if isinstance(args, tuple):
		        args = tuple(_decode(arg) for arg in args)
		    elif isinstance(args, dict):
		        # Mapping operand: the decoded format looks keys up as str, so
		        # both keys and values have to be decoded.
		        args = {_decode(key): _decode(value) for key, value in args.items()}
		    else:
		        args = _decode(args)
		    return (format % args).encode('utf-8', 'surrogateescape')
		# Publish the formatter through the builtins module, which makes the
		# name resolvable from any module without an import (presumably for
		# code rewritten by the fixer -- confirm against the fixer).
		builtins.bytesformatter = bytesformatter

		# Create bytes equivalents for os.environ values
		# NOTE(review): Python 3.2+ documents os.environ as str-only and offers
		# os.environb as the bytes view -- confirm this loop on the target
		# interpreter.
		for name, value in list(os.environ.items()):
		    # UTF-8 is fine for us
		    bname = name.encode('utf-8', 'surrogateescape')
		    bvalue = value.encode('utf-8', 'surrogateescape')
		    os.environ[bname] = bvalue

		# Running the module directly executes the doctests defined in it.
		if __name__ == '__main__':
		    import doctest
		    doctest.testmod()
		65

contrib/hgfixes/fix_bytes.py

0 +1 0

              """Fixer that changes plain strings to bytes strings."""
              import re
              from lib2to3 import fixer_base
              from lib2to3.pgen2 import token
              from lib2to3.fixer_util import Name
              from lib2to3.pygram import python_symbols as syms
              # Matches the start of a plain string literal: an optional raw prefix
              # (r or R) followed by a single or double quote.
              _re = re.compile(r'[rR]?[\'\"]')
              # XXX: Implementing a blacklist in 2to3 turned out to be more troublesome than
              # blacklisting some modules inside the fixers. So, this is what I came up
              # with. FixBytes.transform leaves files whose name is listed here untouched.
              blacklist = ['mercurial/demandimport.py',
+                          'mercurial/py3kcompat.py', # valid python 3 already
                           'mercurial/i18n.py',
                          ]
              def isdocstring(node):
                  """Return True when the string leaf ``node`` counts as documentation.

                  Three checks are applied to ``node.parent``, in this order: a lone
                  string statement directly under the file, anything inside an
                  assignment that involves ``__doc__``, and a lone string statement
                  located somewhere beneath a function or class definition.
                  """
                  definitions = (syms.funcdef, syms.classdef)
                  parent = node.parent
                  def at_module_level(start):
                      # A simple statement whose parent is file_input is a lone string
                      # in the source file.
                      try:
                          return (start.type == syms.simple_stmt and
                                  start.parent.type == syms.file_input)
                      except AttributeError:
                          return False
                  def assigns_doc(start):
                      # Climb until an expression statement mentioning __doc__ is
                      # found; running off the top of the tree raises AttributeError.
                      current = start
                      try:
                          while not (current.type == syms.expr_stmt and
                                     Name('__doc__') in current.children):
                              current = current.parent
                      except AttributeError:
                          return False
                      return True
                  def in_definition(start):
                      # Only a bare string statement can be a docstring; it qualifies
                      # when some ancestor is a function or class definition.
                      if start.type != syms.simple_stmt:
                          return False
                      current = start
                      try:
                          while current.type not in definitions:
                              current = current.parent
                      except AttributeError:
                          return False
                      return True
                  return (at_module_level(parent) or
                          assigns_doc(parent) or
                          in_definition(parent))
              def shouldtransform(node):
                  """Tell whether the string literal ``node`` should get a ``b`` prefix.

                  Returns False for literals whose contents are one of the special
                  names (currently only ``__main__``) and for literals whose
                  great-grandparent node, rendered as text, mentions ``getattr``,
                  ``hasattr``, ``setattr``, ``encode`` or ``decode``. Returns True
                  otherwise.
                  """
                  specialnames = ['__main__']
                  # node.value is the literal as written in the source, i.e. with its
                  # quotes and optional r/R prefix, so the bare contents have to be
                  # extracted before comparing them with the special names.
                  literal = node.value.lstrip('rR')
                  quote = literal[:1]
                  contents = literal.strip(quote) if quote in ('"', "'") else literal
                  if node.value in specialnames or contents in specialnames:
                      return False
                  # Textual check of the surrounding expression: any mention of these
                  # names keeps the literal as a native string.
                  context = str(node.parent.parent.parent)
                  keepnative = ('getattr', 'hasattr', 'setattr', 'encode', 'decode')
                  return not any(name in context for name in keepnative)
              class FixBytes(fixer_base.BaseFix):
                  """Fixer that prefixes plain string literals with ``b``."""
                  PATTERN = 'STRING'
                  def transform(self, node, results):
                      """Return a ``b``-prefixed clone of ``node``, or None to keep it.

                      The node is left alone when the current file is blacklisted,
                      when it is not a STRING token, when its text does not start
                      like a plain (optionally raw) string literal, when it is a
                      docstring, or when shouldtransform() rejects it.
                      """
                      if self.filename in blacklist:
                          return None
                      if node.type != token.STRING:
                          return None
                      if not _re.match(node.value):
                          return None
                      if isdocstring(node) or not shouldtransform(node):
                          return None
                      # Work on a clone so the original leaf stays untouched.
                      prefixed = node.clone()
                      prefixed.value = 'b' + prefixed.value
                      return prefixed

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages