upstream/ipython Commit - r26615:c20d7a0d

Refactor strip_email_quotes...

Blazej Michalik -

r26615:c20d7a0d

parent child

IPython/utils/tests/test_text.py

0 0 -13

                  nt.assert_equal(s, "$HOME")
-             def test_long_substr():
-                 data = ['hi']
-                 nt.assert_equal(text.long_substr(data), 'hi')
-             def test_long_substr2():
-                 data = ['abc', 'abd', 'abf', 'ab']
-                 nt.assert_equal(text.long_substr(data), 'ab')
-             def test_long_substr_empty():
-                 data = []
-                 nt.assert_equal(text.long_substr(data), '')
              def test_strip_email():
                  src = """\
                      >> >>> def f(x):

IPython/utils/text.py

0 +16 -28

              import os
              import re
+             import string
              import sys
              import textwrap
              from string import Formatter
                  return out_ps
-             def long_substr(data):
-                 """Return the longest common substring in a list of strings.
-                 Credit: http://stackoverflow.com/questions/2892931/longest-common-substring-from-more-than-two-strings-python
-                 """
-                 substr = ''
-                 if len(data) > 1 and len(data[0]) > 0:
-                     for i in range(len(data[0])):
-                         for j in range(len(data[0])-i+1):
-                             if j > len(substr) and all(data[0][i:i+j] in x for x in data):
-                                 substr = data[0][i:i+j]
-                 elif len(data) == 1:
-                     substr = data[0]
-                 return substr
              def strip_email_quotes(text):
                  """Strip leading email quotation characters ('>').
                      In [4]: strip_email_quotes('> > text\\n> > more\\n> more...')
                      Out[4]: '> text\\n> more\\nmore...'
-                 So if any line has no quote marks ('>') , then none are stripped from any
+                 So if any line has no quote marks ('>'), then none are stripped from any
                  of them ::
                      In [5]: strip_email_quotes('> > text\\n> > more\\nlast different')
                      Out[5]: '> > text\\n> > more\\nlast different'
                  """
                  lines = text.splitlines()
-                 matches = set()
-                 for line in lines:
-                     prefix = re.match(r'^(\s*>[ >]*)', line)
-                     if prefix:
-                         matches.add(prefix.group(1))
+                 strip_len = 0
+                 for characters in zip(*lines):
+                     # Check if all characters in this position are the same
+                     if len(set(characters)) > 1:
+                         break
+                     prefix_char = characters[0][0]
+                     if prefix_char in string.whitespace or prefix_char == ">":
+                         strip_len += 1
                      else:
                          break
-                 else:
-                     prefix = long_substr(list(matches))
-                     if prefix:
-                         strip = len(prefix)
-                         text = '\n'.join([ ln[strip:] for ln in lines])
+                 text = "\n".join([ln[strip_len:] for ln in lines])
                  return text
              def strip_ansi(source):
                  """
                  Remove ansi escape codes from text.

General Comments 0

Write
Preview

You need to be logged in to leave comments. Log in now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Go to home page
g g	Go to my private gists page
g G	Go to my public gists page
g 0-9	Go to bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Go to summary page
g c	Go to changelog page
g f	Go to files page
g F	Go to files page with file search activated
g p	Go to pull requests page
g o	Go to repository settings
g O	Go to repository access permissions settings
t s	Toggle sidebar on some pages