upstream/ipython Commit - r26615:c20d7a0d

Refactor strip_email_quotes...

Blazej Michalik -

r26615:c20d7a0d

parent child

IPython/utils/tests/test_text.py

0 0 -13

@@ -165,19 +165,6 b' def test_dollar_formatter():'
165	nt.assert_equal(s, "$HOME")	165	nt.assert_equal(s, "$HOME")
166		166
167		167
168	def test_long_substr():
169	data = ['hi']
170	nt.assert_equal(text.long_substr(data), 'hi')
171
172
173	def test_long_substr2():
174	data = ['abc', 'abd', 'abf', 'ab']
175	nt.assert_equal(text.long_substr(data), 'ab')
176
177	def test_long_substr_empty():
178	data = []
179	nt.assert_equal(text.long_substr(data), '')
180
181	def test_strip_email():	168	def test_strip_email():
182	src = """\	169	src = """\
183	>> >>> def f(x):	170	>> >>> def f(x):

IPython/utils/text.py

0 +16 -28

             import os
             import re
+            import string
             import sys
             import textwrap
             from string import Formatter
                 return out_ps
-            def long_substr(data):
-                """Return the longest common substring in a list of strings.
-                Credit: http://stackoverflow.com/questions/2892931/longest-common-substring-from-more-than-two-strings-python
-                """
-                substr = ''
-                if len(data) > 1 and len(data[0]) > 0:
-                    for i in range(len(data[0])):
-                        for j in range(len(data[0])-i+1):
-                            if j > len(substr) and all(data[0][i:i+j] in x for x in data):
-                                substr = data[0][i:i+j]
-                elif len(data) == 1:
-                    substr = data[0]
-                return substr
             def strip_email_quotes(text):
                 """Strip leading email quotation characters ('>').
                     In [4]: strip_email_quotes('> > text\\n> > more\\n> more...')
                     Out[4]: '> text\\n> more\\nmore...'
-                So if any line has no quote marks ('>') , then none are stripped from any
+                So if any line has no quote marks ('>'), then none are stripped from any
                 of them ::
                     In [5]: strip_email_quotes('> > text\\n> > more\\nlast different')
                     Out[5]: '> > text\\n> > more\\nlast different'
                 """
                 lines = text.splitlines()
-                matches = set()
+                strip_len = 0
-                for line in lines:
-                    prefix = re.match(r'^(\s*>[ >]*)', line)
+                for characters in zip(*lines):
-                    if prefix:
+                    # Check if all characters in this position are the same
-                        matches.add(prefix.group(1))
+                    if len(set(characters)) > 1:
+                        break
+                    prefix_char = characters[0][0]
+                    if prefix_char in string.whitespace or prefix_char == ">":
+                        strip_len += 1
                     else:
                         break
-                else:
-                    prefix = long_substr(list(matches))
+                text = "\n".join([ln[strip_len:] for ln in lines])
-                    if prefix:
-                        strip = len(prefix)
-                        text = '\n'.join([ ln[strip:] for ln in lines])
                 return text
             def strip_ansi(source):
                 """
                 Remove ansi escape codes from text.

General Comments 0

Write
Preview

You need to be logged in to leave comments. Log in now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Go to home page
g g	Go to my private gists page
g G	Go to my public gists page
g 0-9	Go to bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Go to summary page
g c	Go to changelog page
g f	Go to files page
g F	Go to files page with file search activated
g p	Go to pull requests page
g o	Go to repository settings
g O	Go to repository access permissions settings
t s	Toggle sidebar on some pages