upstream/ipython Commit - r3459:a6a9d580

Merge branch 'unicode-issues'

Thomas Kluyver -

r3459:a6a9d580

parent child

IPython/core/tests/test_application.py

0 created 644 +68 0

@@ -0,0 +1,68 b''
	1	# coding: utf-8
	2	"""Tests for IPython.core.application"""
	3
	4	import os
	5	import tempfile
	6
	7	from IPython.core.application import Application
	8
	9	def test_unicode_cwd():
	10	"""Check that IPython starts with non-ascii characters in the path."""
	11	wd = tempfile.mkdtemp(suffix=u"€")
	12
	13	old_wd = os.getcwdu()
	14	os.chdir(wd)
	15	#raise Exception(repr(os.getcwd()))
	16	try:
	17	app = Application()
	18	# The lines below are copied from Application.initialize()
	19	app.create_default_config()
	20	app.log_default_config()
	21	app.set_default_config_log_level()
	22
	23	# Find resources needed for filesystem access, using information from
	24	# the above two
	25	app.find_ipython_dir()
	26	app.find_resources()
	27	app.find_config_file_name()
	28	app.find_config_file_paths()
	29
	30	# File-based config
	31	app.pre_load_file_config()
	32	app.load_file_config(suppress_errors=False)
	33	finally:
	34	os.chdir(old_wd)
	35
	36	def test_unicode_ipdir():
	37	"""Check that IPython starts with non-ascii characters in the IP dir."""
	38	ipdir = tempfile.mkdtemp(suffix=u"€")
	39
	40	# Create the config file, so it tries to load it.
	41	with open(os.path.join(ipdir, 'ipython_config.py'), "w") as f:
	42	pass
	43
	44	old_ipdir1 = os.environ.pop("IPYTHONDIR", None)
	45	old_ipdir2 = os.environ.pop("IPYTHON_DIR", None)
	46	os.environ["IPYTHONDIR"] = ipdir.encode("utf-8")
	47	try:
	48	app = Application()
	49	# The lines below are copied from Application.initialize()
	50	app.create_default_config()
	51	app.log_default_config()
	52	app.set_default_config_log_level()
	53
	54	# Find resources needed for filesystem access, using information from
	55	# the above two
	56	app.find_ipython_dir()
	57	app.find_resources()
	58	app.find_config_file_name()
	59	app.find_config_file_paths()
	60
	61	# File-based config
	62	app.pre_load_file_config()
	63	app.load_file_config(suppress_errors=False)
	64	finally:
	65	if old_ipdir1:
	66	os.environ["IPYTHONDIR"] = old_ipdir1
	67	if old_ipdir2:
	68	os.environ["IPYTHONDIR"] = old_ipdir2

IPython/config/loader.py

0 +3 -1

                         return self.config
                     namespace = dict(load_subconfig=load_subconfig, get_config=get_config)
-                    execfile(self.full_filename, namespace)
+                    fs_encoding = sys.getfilesystemencoding() or 'ascii'
+                    conf_filename = self.full_filename.encode(fs_encoding)
+                    execfile(conf_filename, namespace)
                 def _convert_to_config(self):
                     if self.data is None:

IPython/core/application.py

0 +8 -2

                     # our shipped copies of builtin profiles even if they don't have them
                     # in their local ipython directory.
                     prof_dir = os.path.join(get_ipython_package_dir(), 'config', 'profile')
-                    self.config_file_paths = (os.getcwd(), self.ipython_dir, prof_dir)
+                    self.config_file_paths = (os.getcwdu(), self.ipython_dir, prof_dir)
                 def pre_load_file_config(self):
                     """Do actions before the config file is loaded."""
                     pass
-                def load_file_config(self):
+                def load_file_config(self, suppress_errors=True):
                     """Load the config file.
                     This tries to load the config file from disk.  If successful, the
                     ``CONFIG_FILE`` config variable is set to the resolved config file
                     location.  If not successful, an empty config is used.
+                    By default, errors in loading config are handled, and a warning
+                    printed on screen. For testing, the suppress_errors option is set
+                    to False, so errors will make tests fail.
                     """
                     self.log.debug("Attempting to load config file: %s" %
                                    self.config_file_name)
                                            self.config_file_name, exc_info=True)
                         self.file_config = Config()
                     except:
+                        if not suppress_errors:     # For testing purposes
+                            raise
                         self.log.warn("Error loading config file: %s" %
                                       self.config_file_name, exc_info=True)
                         self.file_config = Config()

IPython/core/compilerop.py

0 +3 -1

             def code_name(code, number=0):
                 """ Compute a (probably) unique name for code for caching.
+                This now expects code to be unicode.
                 """
-                hash_digest = hashlib.md5(code).hexdigest()
+                hash_digest = hashlib.md5(code.encode("utf-8")).hexdigest()
                 # Include the number and 12 characters of the hash in the name.  It's
                 # pretty much impossible that in a single session we'll have collisions
                 # even with truncated hashes, and the full one makes tracebacks too long

IPython/core/inputsplitter.py

0 +5 -21

             # Imports
             #-----------------------------------------------------------------------------
             # stdlib
+            import ast
             import codeop
             import re
             import sys
                 commands : list of str
                     Separate commands that can be exec'ed independently.
                 """
-                import compiler
                 # compiler.parse treats trailing spaces after a newline as a
                 # SyntaxError.  This is different than codeop.CommandCompiler, which
                 # will compile the trailing spaces just fine.  We simply strip any
                 python_ori = python # save original in case we bail on error
                 python = python.strip()
-                # The compiler module does not like unicode. We need to convert
-                # it encode it:
-                if isinstance(python, unicode):
-                    # Use the utf-8-sig BOM so the compiler detects this a UTF-8
-                    # encode string.
-                    python = '\xef\xbb\xbf' + python.encode('utf-8')
                 # The compiler module will parse the code into an abstract syntax tree.
                 # This has a bug with str("a\nb"), but not str("""a\nb""")!!!
                 try:
-                    ast = compiler.parse(python)
+                    code_ast = ast.parse(python)
                 except:
                     return [python_ori]
                 # Uncomment to help debug the ast tree
-                # for n in ast.node:
+                # for n in code_ast.body:
                 #     print n.lineno,'->',n
                 # Each separate command is available by iterating over ast.node. The
                 # other situations that cause Discard nodes that shouldn't be discarded.
                 # We might eventually discover other cases where lineno is None and have
                 # to put in a more sophisticated test.
-                linenos = [x.lineno-1 for x in ast.node if x.lineno is not None]
+                linenos = [x.lineno-1 for x in code_ast.body if x.lineno is not None]
-                # When we have a bare string as the first statement, it does not end up as
-                # a Discard Node in the AST as we might expect. Instead, it gets interpreted
-                # as the docstring of the module. Check for this case and prepend 0 (the
-                # first line number) to the list of linenos to account for it.
-                if ast.doc is not None:
-                    linenos.insert(0, 0)
                 # When we finally get the slices, we will need to slice all the way to
                 # the end even though we don't have a line number for it. Fortunately,
                     setattr(self, store, self._set_source(buffer))
                 def _set_source(self, buffer):
-                    return ''.join(buffer).encode(self.encoding)
+                    return u''.join(buffer)
             #-----------------------------------------------------------------------------

IPython/core/interactiveshell.py

0 +4 -3

                         # otherwise we end up with a monster history after a while:
                         readline.set_history_length(self.history_length)
+                        stdin_encoding = sys.stdin.encoding or "utf-8"
                         # Load the last 1000 lines from history
                         for _, _, cell in self.history_manager.get_tail(1000,
                                                             include_latest=True):
                             if cell.strip(): # Ignore blank lines
                                 for line in cell.splitlines():
-                                    readline.add_history(line)
+                                    readline.add_history(line.encode(stdin_encoding))
                     # Configure auto-indent for all platforms
                     self.set_autoindent(self.autoindent)
                         cell = self.prefilter_manager.prefilter_line(blocks[0])
                         blocks = self.input_splitter.split_blocks(cell)
                     # Store the 'ipython' version of the cell as well, since that's what
                     # needs to go into the translated history and get executed (the
                     # original cell may contain non-python syntax).
                     else:
                         usource = source
-                    if 0:  # dbg
+                    if False:  # dbg
                         print 'Source:', repr(source)  # dbg
                         print 'USource:', repr(usource)  # dbg
                         print 'type:', type(source) # dbg

IPython/core/magic.py

0 +2 -1

                             return
                     cmds = self.extract_input_lines(ranges, 'r' in opts)
                     with open(fname,'w') as f:
-                        f.write(cmds)
+                        f.write("# coding: utf-8\n")
+                        f.write(cmds.encode("utf-8"))
                     print 'The following commands were written to file `%s`:' % fname
                     print cmds

IPython/core/tests/test_compilerop.py

0 +12 0

+            # coding: utf-8
             """Tests for the compilerop module.
             """
             #-----------------------------------------------------------------------------
             # Stdlib imports
             import linecache
+            import sys
             # Third-party imports
             import nose.tools as nt
                 cp('x=1', 'single')
                 nt.assert_true(len(linecache.cache) > ncache)
+            def setUp():
+                # Check we're in a proper Python 2 environment (some imports, such
+                # as GTK, can change the default encoding, which can hide bugs.)
+                nt.assert_equal(sys.getdefaultencoding(), "ascii")
+            def test_compiler_unicode():
+                cp = compilerop.CachingCompiler()
+                ncache = len(linecache.cache)
+                cp(u"t = 'žćčšđ'", "single")
+                nt.assert_true(len(linecache.cache) > ncache)
             def test_compiler_check_cache():
                 """Test the compiler properly manages the cache.

IPython/core/tests/test_history.py

0 +8 -3

+            # coding: utf-8
             """Tests for the IPython tab-completion machinery.
             """
             #-----------------------------------------------------------------------------
             from IPython.utils.tempdir import TemporaryDirectory
             from IPython.core.history import HistoryManager, extract_hist_ranges
-            def test_history():
+            def setUp():
+                nt.assert_equal(sys.getdefaultencoding(), "ascii")
+            def test_history():
                 ip = get_ipython()
                 with TemporaryDirectory() as tmpdir:
                     #tmpdir = '/software/temp'
                         ip.history_manager.init_db()  # Has to be called after changing file
                         ip.history_manager.reset()
                         print 'test',histfile
-                        hist = ['a=1', 'def f():\n    test = 1\n    return test', 'b=2']
+                        hist = ['a=1', 'def f():\n    test = 1\n    return test', u"b='€Æ¾÷ß'"]
                         for i, h in enumerate(hist, start=1):
                             ip.history_manager.store_inputs(i, h)
                         testfilename = os.path.realpath(os.path.join(tmpdir, "test.py"))
                         ip.magic_save(testfilename + " ~1/1-3")
                         testfile = open(testfilename, "r")
-                        nt.assert_equal(testfile.read(), "\n".join(hist))
+                        nt.assert_equal(testfile.read().decode("utf-8"),
+                                "# coding: utf-8\n" + "\n".join(hist))
                         # Duplicate line numbers - check that it doesn't crash, and
                         # gets a new session
                         # Restore history manager
                         ip.history_manager = hist_manager_ori
             def test_extract_hist_ranges():
                 instr = "1 2/3 ~4/5-6 ~4/7-~4/9 ~9/2-~7/5"
                 expected = [(0, 1, 2),  # 0 == current session

IPython/core/tests/test_inputsplitter.py

0 +1 -1

                 def test_unicode(self):
                     self.isp.push(u"Pérez")
                     self.isp.push(u'\xc3\xa9')
-                    self.isp.push("u'\xc3\xa9'")
+                    self.isp.push(u"u'\xc3\xa9'")
             class InteractiveLoopTestCase(unittest.TestCase):
                 """Tests for an interactive loop like a python shell.

IPython/core/tests/test_magic.py

0 +2 -2

             def test_dirops():
                 """Test various directory handling operations."""
-                curpath = lambda :os.path.splitdrive(os.getcwd())[1].replace('\\','/')
+                curpath = lambda :os.path.splitdrive(os.getcwdu())[1].replace('\\','/')
-                startdir = os.getcwd()
+                startdir = os.getcwdu()
                 ipdir = _ip.ipython_dir
                 try:
                     _ip.magic('cd "%s"' % ipdir)

IPython/testing/iptest.py

0 +2 -3

             have['twisted'] = test_for('twisted')
             have['foolscap'] = test_for('foolscap')
             have['pexpect'] = test_for('pexpect')
-            have['gtk'] = test_for('gtk')
-            have['gobject'] = test_for('gobject')
             #-----------------------------------------------------------------------------
             # Functions and classes
                 if not have['wx']:
                     exclusions.append(ipjoin('lib', 'inputhookwx'))
-                if not have['gtk'] or not have['gobject']:
+                # We do this unconditionally, so that the test suite doesn't import
+                # gtk, changing the default encoding and masking some unicode bugs.
                 exclusions.append(ipjoin('lib', 'inputhookgtk'))
                 # These have to be skipped on win32 because they use echo, rm, cd, etc.

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages