upstream/ipython Commit - r3459:a6a9d580

Merge branch 'unicode-issues'

Thomas Kluyver -

r3459:a6a9d580

parent child

IPython/core/tests/test_application.py

0 created 644 +68 0

			@@ -0,0 +1,68 b''
		1	# coding: utf-8
		2	"""Tests for IPython.core.application"""
		3
		4	import os
		5	import tempfile
		6
		7	from IPython.core.application import Application
		8
		def test_unicode_cwd():
		    """Check that IPython starts with non-ascii characters in the path.

		    Runs the configuration-loading steps of ``Application.initialize()``
		    from inside a temporary working directory whose name ends in a
		    non-ASCII character.  ``suppress_errors=False`` is passed to
		    ``load_file_config`` so that a failure while loading the config file
		    fails the test instead of being handled inside the application.
		    """
		    import shutil  # local import: only needed to clean up the temp dir

		    wd = tempfile.mkdtemp(suffix=u"€")

		    old_wd = os.getcwdu()
		    os.chdir(wd)
		    try:
		        app = Application()
		        # The lines below are copied from Application.initialize()
		        app.create_default_config()
		        app.log_default_config()
		        app.set_default_config_log_level()

		        # Find resources needed for filesystem access, using information
		        # from the above two
		        app.find_ipython_dir()
		        app.find_resources()
		        app.find_config_file_name()
		        app.find_config_file_paths()

		        # File-based config
		        app.pre_load_file_config()
		        app.load_file_config(suppress_errors=False)
		    finally:
		        # Leave the temporary directory before deleting it; some platforms
		        # refuse to remove the current working directory.
		        os.chdir(old_wd)
		        shutil.rmtree(wd, ignore_errors=True)
		35
		def test_unicode_ipdir():
		    """Check that IPython starts with non-ascii characters in the IP dir.

		    Points the ``IPYTHONDIR`` environment variable at a temporary directory
		    whose name ends in a non-ASCII character, creates an empty
		    ``ipython_config.py`` there, and runs the configuration-loading steps
		    of ``Application.initialize()``.  ``suppress_errors=False`` is passed
		    to ``load_file_config`` so that a failure while loading the config
		    file fails the test.

		    The previous values of ``IPYTHONDIR`` and ``IPYTHON_DIR`` are restored
		    afterwards, each under its own name, and the temporary directory is
		    removed.
		    """
		    import shutil  # local import: only needed to clean up the temp dir

		    ipdir = tempfile.mkdtemp(suffix=u"€")

		    # Create the config file, so it tries to load it.
		    with open(os.path.join(ipdir, 'ipython_config.py'), "w"):
		        pass

		    # Remember and clear both spellings of the variable so that only the
		    # value set below is visible to the application.
		    old_ipdir1 = os.environ.pop("IPYTHONDIR", None)
		    old_ipdir2 = os.environ.pop("IPYTHON_DIR", None)
		    try:
		        os.environ["IPYTHONDIR"] = ipdir.encode("utf-8")

		        app = Application()
		        # The lines below are copied from Application.initialize()
		        app.create_default_config()
		        app.log_default_config()
		        app.set_default_config_log_level()

		        # Find resources needed for filesystem access, using information
		        # from the above two
		        app.find_ipython_dir()
		        app.find_resources()
		        app.find_config_file_name()
		        app.find_config_file_paths()

		        # File-based config
		        app.pre_load_file_config()
		        app.load_file_config(suppress_errors=False)
		    finally:
		        # Drop the test's override first, so it does not linger when there
		        # was no previous value to put back.
		        os.environ.pop("IPYTHONDIR", None)
		        if old_ipdir1 is not None:
		            os.environ["IPYTHONDIR"] = old_ipdir1
		        if old_ipdir2 is not None:
		            os.environ["IPYTHON_DIR"] = old_ipdir2
		        shutil.rmtree(ipdir, ignore_errors=True)

IPython/config/loader.py

0 +3 -1

                          return self.config
                      namespace = dict(load_subconfig=load_subconfig, get_config=get_config)
-                     execfile(self.full_filename, namespace)
+                     fs_encoding = sys.getfilesystemencoding() or 'ascii'
+                     conf_filename = self.full_filename.encode(fs_encoding)
+                     execfile(conf_filename, namespace)
                  def _convert_to_config(self):
                      if self.data is None:

IPython/core/application.py

0 +8 -2

                      # our shipped copies of builtin profiles even if they don't have them
                      # in their local ipython directory.
                      prof_dir = os.path.join(get_ipython_package_dir(), 'config', 'profile')
-                     self.config_file_paths = (os.getcwd(), self.ipython_dir, prof_dir)
+                     self.config_file_paths = (os.getcwdu(), self.ipython_dir, prof_dir)
                  def pre_load_file_config(self):
                      """Do actions before the config file is loaded."""
                      pass
-                 def load_file_config(self):
+                 def load_file_config(self, suppress_errors=True):
                      """Load the config file.
                      This tries to load the config file from disk.  If successful, the
                      ``CONFIG_FILE`` config variable is set to the resolved config file
                      location.  If not successful, an empty config is used.
+                     By default, errors in loading config are handled, and a warning
+                     printed on screen. For testing, the suppress_errors option is set
+                     to False, so errors will make tests fail.
                      """
                      self.log.debug("Attempting to load config file: %s" %
                                     self.config_file_name)
                                             self.config_file_name, exc_info=True)
                          self.file_config = Config()
                      except:
+                         if not suppress_errors:     # For testing purposes
+                             raise
                          self.log.warn("Error loading config file: %s" %
                                        self.config_file_name, exc_info=True)
                          self.file_config = Config()

IPython/core/compilerop.py

0 +3 -1

              def code_name(code, number=0):
                  """ Compute a (probably) unique name for code for caching.
+                 This now expects code to be unicode.
                  """
-                 hash_digest = hashlib.md5(code).hexdigest()
+                 hash_digest = hashlib.md5(code.encode("utf-8")).hexdigest()
                  # Include the number and 12 characters of the hash in the name.  It's
                  # pretty much impossible that in a single session we'll have collisions
                  # even with truncated hashes, and the full one makes tracebacks too long

IPython/core/inputsplitter.py

0 +6 -22

              # Imports
              #-----------------------------------------------------------------------------
              # stdlib
+             import ast
              import codeop
              import re
              import sys
                  commands : list of str
                      Separate commands that can be exec'ed independently.
                  """
-                 import compiler
                  # compiler.parse treats trailing spaces after a newline as a
                  # SyntaxError.  This is different than codeop.CommandCompiler, which
                  # will compile the trailing spaces just fine.  We simply strip any
                  python_ori = python # save original in case we bail on error
                  python = python.strip()
-                 # The compiler module does not like unicode. We need to convert
-                 # it encode it:
-                 if isinstance(python, unicode):
-                     # Use the utf-8-sig BOM so the compiler detects this a UTF-8
-                     # encode string.
-                     python = '\xef\xbb\xbf' + python.encode('utf-8')
                  # The compiler module will parse the code into an abstract syntax tree.
                  # This has a bug with str("a\nb"), but not str("""a\nb""")!!!
                  try:
-                     ast = compiler.parse(python)
+                     code_ast = ast.parse(python)
                  except:
                      return [python_ori]
                  # Uncomment to help debug the ast tree
-                 # for n in ast.node:
+                 # for n in code_ast.body:
                  #     print n.lineno,'->',n
                  # Each separate command is available by iterating over code_ast.body. The
                  # other situations that cause Discard nodes that shouldn't be discarded.
                  # We might eventually discover other cases where lineno is None and have
                  # to put in a more sophisticated test.
-                 linenos = [x.lineno-1 for x in ast.node if x.lineno is not None]
-                 # When we have a bare string as the first statement, it does not end up as
-                 # a Discard Node in the AST as we might expect. Instead, it gets interpreted
-                 # as the docstring of the module. Check for this case and prepend 0 (the
-                 # first line number) to the list of linenos to account for it.
-                 if ast.doc is not None:
-                     linenos.insert(0, 0)
+                 linenos = [x.lineno-1 for x in code_ast.body if x.lineno is not None]
                  # When we finally get the slices, we will need to slice all the way to
                  # the end even though we don't have a line number for it. Fortunately,
                      If input lines are not newline-terminated, a newline is automatically
                      appended."""
                      if buffer is None:
                          buffer = self._buffer
                      setattr(self, store, self._set_source(buffer))
                  def _set_source(self, buffer):
-                     return ''.join(buffer).encode(self.encoding)
+                     return u''.join(buffer)
              #-----------------------------------------------------------------------------

IPython/core/interactiveshell.py

0 +4 -3

                          # otherwise we end up with a monster history after a while:
                          readline.set_history_length(self.history_length)
+                         stdin_encoding = sys.stdin.encoding or "utf-8"
                          # Load the last 1000 lines from history
                          for _, _, cell in self.history_manager.get_tail(1000,
                                                              include_latest=True):
                              if cell.strip(): # Ignore blank lines
                                  for line in cell.splitlines():
-                                     readline.add_history(line)
+                                     readline.add_history(line.encode(stdin_encoding))
                      # Configure auto-indent for all platforms
                      self.set_autoindent(self.autoindent)
                      if len(cell.splitlines()) <= 1:
                          cell = self.prefilter_manager.prefilter_line(blocks[0])
                          blocks = self.input_splitter.split_blocks(cell)
                      # Store the 'ipython' version of the cell as well, since that's what
                      # needs to go into the translated history and get executed (the
                      else:
                          usource = source
-                     if 0:  # dbg
+                     if False:  # dbg
                          print 'Source:', repr(source)  # dbg
                          print 'USource:', repr(usource)  # dbg
                          print 'type:', type(source) # dbg

IPython/core/magic.py

0 +2 -1

                              return
                      cmds = self.extract_input_lines(ranges, 'r' in opts)
                      with open(fname,'w') as f:
-                         f.write(cmds)
+                         f.write("# coding: utf-8\n")
+                         f.write(cmds.encode("utf-8"))
                      print 'The following commands were written to file `%s`:' % fname
                      print cmds

IPython/core/tests/test_compilerop.py

0 +12 0

+             # coding: utf-8
              """Tests for the compilerop module.
              """
              #-----------------------------------------------------------------------------
              # Stdlib imports
              import linecache
+             import sys
              # Third-party imports
              import nose.tools as nt
                  cp('x=1', 'single')
                  nt.assert_true(len(linecache.cache) > ncache)
+             def setUp():
+                 # Check we're in a proper Python 2 environment (some imports, such
+                 # as GTK, can change the default encoding, which can hide bugs.)
+                 nt.assert_equal(sys.getdefaultencoding(), "ascii")
+             def test_compiler_unicode():
+                 cp = compilerop.CachingCompiler()
+                 ncache = len(linecache.cache)
+                 cp(u"t = 'žćčšđ'", "single")
+                 nt.assert_true(len(linecache.cache) > ncache)
              def test_compiler_check_cache():
                  """Test the compiler properly manages the cache.

IPython/core/tests/test_history.py

0 +8 -3

+             # coding: utf-8
              """Tests for the IPython history machinery.
              """
              #-----------------------------------------------------------------------------
              from IPython.utils.tempdir import TemporaryDirectory
              from IPython.core.history import HistoryManager, extract_hist_ranges
-             def test_history():
+             def setUp():
+                 nt.assert_equal(sys.getdefaultencoding(), "ascii")
+             def test_history():
                  ip = get_ipython()
                  with TemporaryDirectory() as tmpdir:
                      #tmpdir = '/software/temp'
                          ip.history_manager.init_db()  # Has to be called after changing file
                          ip.history_manager.reset()
                          print 'test',histfile
-                         hist = ['a=1', 'def f():\n    test = 1\n    return test', 'b=2']
+                         hist = ['a=1', 'def f():\n    test = 1\n    return test', u"b='€Æ¾÷ß'"]
                          for i, h in enumerate(hist, start=1):
                              ip.history_manager.store_inputs(i, h)
                          testfilename = os.path.realpath(os.path.join(tmpdir, "test.py"))
                          ip.magic_save(testfilename + " ~1/1-3")
                          testfile = open(testfilename, "r")
-                         nt.assert_equal(testfile.read(), "\n".join(hist))
+                         nt.assert_equal(testfile.read().decode("utf-8"),
+                                 "# coding: utf-8\n" + "\n".join(hist))
                          # Duplicate line numbers - check that it doesn't crash, and
                          # gets a new session
                          # Restore history manager
                          ip.history_manager = hist_manager_ori
              def test_extract_hist_ranges():
                  instr = "1 2/3 ~4/5-6 ~4/7-~4/9 ~9/2-~7/5"
                  expected = [(0, 1, 2),  # 0 == current session

IPython/core/tests/test_inputsplitter.py

0 +1 -1

                  def test_unicode(self):
                      self.isp.push(u"Pérez")
                      self.isp.push(u'\xc3\xa9')
-                     self.isp.push("u'\xc3\xa9'")
+                     self.isp.push(u"u'\xc3\xa9'")
              class InteractiveLoopTestCase(unittest.TestCase):
                  """Tests for an interactive loop like a python shell.

IPython/core/tests/test_magic.py

0 +2 -2

              def test_dirops():
                  """Test various directory handling operations."""
-                 curpath = lambda :os.path.splitdrive(os.getcwd())[1].replace('\\','/')
+                 curpath = lambda :os.path.splitdrive(os.getcwdu())[1].replace('\\','/')
-                 startdir = os.getcwd()
+                 startdir = os.getcwdu()
                  ipdir = _ip.ipython_dir
                  try:
                      _ip.magic('cd "%s"' % ipdir)

IPython/testing/iptest.py

0 +4 -5

              have['twisted'] = test_for('twisted')
              have['foolscap'] = test_for('foolscap')
              have['pexpect'] = test_for('pexpect')
-             have['gtk'] = test_for('gtk')
-             have['gobject'] = test_for('gobject')
              #-----------------------------------------------------------------------------
              # Functions and classes
                  if not have['wx']:
                      exclusions.append(ipjoin('lib', 'inputhookwx'))
-                 if not have['gtk'] or not have['gobject']:
-                     exclusions.append(ipjoin('lib', 'inputhookgtk'))
+                 # We do this unconditionally, so that the test suite doesn't import
+                 # gtk, changing the default encoding and masking some unicode bugs.
+                 exclusions.append(ipjoin('lib', 'inputhookgtk'))
                  # These have to be skipped on win32 because they use echo, rm, cd, etc.
                  # See ticket https://bugs.launchpad.net/bugs/366982

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages