##// END OF EJS Templates
add_anchor always return unicode
add_anchor always return unicode

File last commit:

r11937:516b6450
r11937:516b6450
Show More
strings.py
171 lines | 4.4 KiB | text/x-python | PythonLexer
MinRK
add html_text and add_anchor filters...
r11302 # coding: utf-8
Jonathan Frederic
Cleanup and refactor of filters
r10676 """String filters.
Jonathan Frederic
Moved wrap code into Strings utility file.
r10433
Jonathan Frederic
Cleanup and refactor of filters
r10676 Contains a collection of useful string manipulation filters for use in Jinja
templates.
Jonathan Frederic
Moved wrap code into Strings utility file.
r10433 """
#-----------------------------------------------------------------------------
# Copyright (c) 2013, the IPython Development Team.
#
# Distributed under the terms of the Modified BSD License.
#
# The full license is in the file COPYING.txt, distributed with this software.
#-----------------------------------------------------------------------------
#-----------------------------------------------------------------------------
# Imports
#-----------------------------------------------------------------------------
MinRK
fix `file/` URL replacements in nbconvert
r11202 import re
Jonathan Frederic
Cleanup and refactor of filters
r10676 import textwrap
MinRK
add html_text and add_anchor filters...
r11302 from xml.etree import ElementTree
MinRK
convert IPython syntax to Python syntax in nbconvert python template...
r11711
from IPython.core.interactiveshell import InteractiveShell
MinRK
add html_text and add_anchor filters...
r11302 from IPython.utils import py3compat
Brian E. Granger
Fixing import for nbconvert.
r11089
Jonathan Frederic
Moved wrap code into Strings utility file.
r10433 #-----------------------------------------------------------------------------
# Functions
#-----------------------------------------------------------------------------
Jonathan Frederic
Cleanup and refactor of filters
r10676
Brian E. Granger
Fixing import logic.
# Public names exported by this module; each entry is a filter function
# defined further down in this file.
__all__ = [
    'wrap_text',
    'html2text',
    'add_anchor',
    'strip_dollars',
    'strip_files_prefix',
    'comment_lines',
    'get_lines',
    'ipython2python',
]
Jonathan Frederic
Filter names cleanup
def wrap_text(text, width=100):
    """
    Intelligently wrap text.
    Wrap text without breaking words if possible.

    Each input line (split on '\\n') is wrapped independently with
    ``textwrap.wrap``, so existing line breaks are kept; a blank input
    line stays a blank line in the output.

    Parameters
    ----------
    text : str
        Text to wrap.
    width : int, optional
        Number of characters to wrap to, default 100.

    Returns
    -------
    str
        The wrapped text, with lines joined by '\\n'.
    """
    # textwrap.wrap returns [] for an empty line, which joins back to '',
    # so empty lines survive the round trip.
    wrapped_lines = ['\n'.join(textwrap.wrap(line, width))
                     for line in text.split('\n')]
    return '\n'.join(wrapped_lines)
MinRK
add html_text and add_anchor filters...
r11302
Jonathan Frederic
Filter names cleanup
def html2text(element):
    """Extract the inner text from an HTML fragment.

    Analog of jQuery's $(element).text()

    Parameters
    ----------
    element : str or ElementTree element
        A string is first parsed with ``ElementTree.fromstring``; any other
        value is used directly as an element.

    Returns
    -------
    str
        The element's own text, followed by the text of every child
        (collected recursively), followed by the element's tail text.
    """
    if isinstance(element, py3compat.string_types):
        element = ElementTree.fromstring(element)

    # Gather the fragments in document order and join them once at the end.
    pieces = [element.text or ""]
    pieces.extend(html2text(child) for child in element)
    pieces.append(element.tail or "")
    return "".join(pieces)
def add_anchor(html):
    """Add an anchor-link to an html header tag

    For use in heading cells

    Parameters
    ----------
    html : str
        Markup for a single element; it is parsed with
        ``ElementTree.fromstring``.

    Returns
    -------
    unicode
        The serialized element, with an ``id`` attribute set and an
        ``<a class="anchor-link">`` child appended.
    """
    header = ElementTree.fromstring(py3compat.cast_bytes_py2(html))

    # The anchor name is the header's inner text with spaces turned into
    # dashes; it is used both as the element id and as the link target.
    anchor_name = html2text(header).replace(' ', '-')
    header.set('id', anchor_name)

    anchor = ElementTree.Element(
        "a", {"class" : "anchor-link", "href" : "#" + anchor_name})
    anchor.text = u'¶'
    header.append(anchor)

    # Known issue of Python3.x, ElementTree.tostring() returns a byte string
    # instead of a text string.  See issue http://bugs.python.org/issue10942
    # Workaround is to make sure the bytes are casted to a string.
    serialized = ElementTree.tostring(header)
    return py3compat.str_to_unicode(py3compat.bytes_to_str(serialized))
MinRK
allow extra pandoc args
r11293
Jonathan Frederic
Moved more code to Strings utilities file
r10434
def strip_dollars(text):
    """
    Remove leading and trailing dollar symbols from text.

    Only the '$' characters at the two ends of the string are removed
    (e.g. the delimiters around '$x^2$'); dollar symbols in the middle
    of the text are left untouched.

    Parameters
    ----------
    text : str
        Text to remove dollars from

    Returns
    -------
    str
        The text without any leading or trailing '$' characters.
    """
    return text.strip('$')
jakobgager
Small latex mods: Escapes, Headings, Equations...
r10882
MinRK
fix `file/` URL replacements in nbconvert
# Matches a `src=` or `href=` attribute (with an optional opening quote)
# whose value starts with the fake `files/` prefix.
files_url_pattern = re.compile(r'(src|href)\=([\'"]?)files/')


def strip_files_prefix(text):
    """
    Fix all fake URLs that start with `files/`,
    stripping out the `files/` prefix.

    Parameters
    ----------
    text : str
        Text in which to replace 'src="files/real...' with 'src="real...'

    Returns
    -------
    str
        The text with every matched `files/` prefix removed.
    """
    def _without_prefix(match):
        # Rebuild the attribute name, '=' and the optional quote, leaving
        # out the matched 'files/' part.
        return match.group(1) + "=" + match.group(2)

    return files_url_pattern.sub(_without_prefix, text)
Jonathan Frederic
Post code-review, extended refactor.
r10485
Jonathan Frederic
Filter names cleanup
def comment_lines(text, prefix='# '):
    """
    Comment out every line of the input text.

    Parameters
    ----------
    text : str
        Text to comment out.
    prefix : str
        String placed at the start of each line, default '# '.

    Returns
    -------
    str
        The text with `prefix` in front of every line; lines are split
        and re-joined on '\\n'.
    """
    # Splitting always yields at least one piece, so the first line (even an
    # empty one) also receives the prefix.
    return '\n'.join(prefix + line for line in text.split('\n'))
Jonathan Frederic
Cleanup and refactor of filters
r10676
Jonathan Frederic
Post code-review, extended refactor.
r10485
Jonathan Frederic
Cleanup and refactor of filters
def get_lines(text, start=None, end=None):
    """
    Return a selected range of lines from the input text.

    The text is split on '\\n', sliced as ``lines[start:end]`` and joined
    back together with '\\n'.

    Parameters
    ----------
    text : str
        Text to parse lines from.
    start : int, optional
        Index of the first line to keep (slice start).
    end : int, optional
        Index at which to stop (slice end, not included in the result).

    Returns
    -------
    str
        The selected lines joined by '\\n'.
    """
    selection = slice(start, end)
    return "\n".join(text.split("\n")[selection])
MinRK
convert IPython syntax to Python syntax in nbconvert python template...
r11711
def ipython2python(code):
    """Transform IPython syntax to pure Python syntax

    Parameters
    ----------
    code : str
        IPython code, to be transformed to pure Python

    Returns
    -------
    The result of running `code` through the ``transform_cell`` method of
    the input transformer manager of ``InteractiveShell.instance()``.
    """
    transformer = InteractiveShell.instance().input_transformer_manager
    return transformer.transform_cell(code)