upstream/ipython Commit - r8309:aca66064

make source_to_unicode use BytesIO and refactor

Jörgen Stenarson -

r8309:aca66064

parent child

IPython/utils/openpy.py

0 +22 -16

              from __future__ import absolute_import
              import io
-             from io import TextIOWrapper
+             from io import TextIOWrapper, BytesIO
              import re
-             from StringIO import StringIO
              import urllib
              cookie_re = re.compile(ur"coding[:=]\s*([-\w.]+)", re.UNICODE)
                      text.mode = 'r'
                      return text
-             def source_to_unicode(txt):
-                 """Converts string with python source code to unicode
+             def source_to_unicode(txt, errors='replace', skip_encoding_cookie=True):
+                 """Converts a bytes string with python source code to unicode.
+                 Unicode strings are passed through unchanged. Byte strings are checked
+                 for the python source file encoding cookie to determine encoding.
+                 txt can be either a bytes buffer or a string containing the source
+                 code.
                  """
                  if isinstance(txt, unicode):
                      return txt
+                 if isinstance(txt, str):
+                     buffer = BytesIO(txt)
+                 else:
+                     buffer = txt
                  try:
-                     coding, _ = detect_encoding(StringIO(txt).readline)
+                     encoding, _ = detect_encoding(buffer.readline)
                  except SyntaxError:
-                     coding = "ascii"
-                 return txt.decode(coding, errors="replace")
+                     encoding = "ascii"
+                 buffer.seek(0)
+                 text = TextIOWrapper(buffer, encoding, errors=errors, line_buffering=True)
+                 text.mode = 'r'
+                 if skip_encoding_cookie:
+                     return u"".join(strip_encoding_cookie(text))
+                 else:
+                     return text.read()
              def strip_encoding_cookie(filelike):
                  """Generator to pull lines from a text-mode file, skipping the encoding
                  """
                  response = urllib.urlopen(url)
                  buffer = io.BytesIO(response.read())
-                 encoding, lines = detect_encoding(buffer.readline)
-                 buffer.seek(0)
-                 text = TextIOWrapper(buffer, encoding, errors=errors, line_buffering=True)
-                 text.mode = 'r'
-                 if skip_encoding_cookie:
-                     return "".join(strip_encoding_cookie(text))
-                 else:
-                     return text.read()
+                 return source_to_unicode(buffer, errors, skip_encoding_cookie)

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages