upstream/ipython Commit - r11302:fdb4d7d0

add html_text and add_anchor filters...

MinRK -

r11302:fdb4d7d0

parent child

IPython/nbconvert/exporters/exporter.py

0 +2 0

              """This module defines Exporter, a highly configurable converter
              that uses Jinja2 to export notebook files into different formats.
              """
              #-----------------------------------------------------------------------------
              # Copyright (c) 2013, the IPython Development Team.
              #
              # Distributed under the terms of the Modified BSD License.
              #
              # The full license is in the file COPYING.txt, distributed with this software.
              #-----------------------------------------------------------------------------
              #-----------------------------------------------------------------------------
              # Imports
              #-----------------------------------------------------------------------------
              from __future__ import print_function, absolute_import
              # Stdlib imports
              import io
              import os
              import inspect
              from copy import deepcopy
              # other libs/dependencies
              from jinja2 import Environment, FileSystemLoader, ChoiceLoader
              # IPython imports
              from IPython.config.configurable import Configurable
              from IPython.config import Config
              from IPython.nbformat import current as nbformat
              from IPython.utils.traitlets import MetaHasTraits, Unicode
              from IPython.utils.text import indent
              from IPython.nbconvert import filters
              from IPython.nbconvert import transformers
              #-----------------------------------------------------------------------------
              # Globals and constants
              #-----------------------------------------------------------------------------
              #Jinja2 extensions to load.
              JINJA_EXTENSIONS = ['jinja2.ext.loopcontrols']
              default_filters = {
                      'indent': indent,
                      'markdown': filters.markdown2html,
                      'ansi2html': filters.ansi2html,
                      'filter_data_type': filters.DataTypeFilter,
                      'get_lines': filters.get_lines,
                      'highlight': filters.highlight,
                      'highlight2html': filters.highlight,
                      'highlight2latex': filters.highlight2latex,
                      'markdown2latex': filters.markdown2latex,
                      'markdown2rst': filters.markdown2rst,
                      'pycomment': filters.python_comment,
                      'rm_ansi': filters.remove_ansi,
                      'rm_dollars': filters.strip_dollars,
                      'rm_fake': filters.rm_fake,
+                     'html_text' : filters.html_text,
+                     'add_anchor': filters.add_anchor,
                      'ansi2latex': filters.ansi2latex,
                      'rm_math_space': filters.rm_math_space,
                      'wrap': filters.wrap
              }
              #-----------------------------------------------------------------------------
              # Class
              #-----------------------------------------------------------------------------
              class Exporter(Configurable):
                  """
                  Exports notebooks into other file formats.  Uses Jinja 2 templating engine
                  to output new formats.  Inherit from this class if you are creating a new
                  template type along with new filters/transformers.  If the filters/
                  transformers provided by default suffice, there is no need to inherit from
                  this class.  Instead, override the template_file and file_extension
                  traits via a config file.
                  {filters}
                  """

                  # Finish the docstring: substitute the names of the default filters
                  # for the {filters} placeholder above.
                  __doc__ = __doc__.format(filters = '- '+'\n    - '.join(default_filters.keys()))

                  template_file = Unicode(
                          '', config=True,
                          help="Name of the template file to use")

                  file_extension = Unicode(
                      'txt', config=True,
                      help="Extension of the file that should be written to disk"
                      )

                  template_path = Unicode(
                      os.path.join("..", "templates"), config=True,
                      help="Path where the template files are located.")

                  template_skeleton_path = Unicode(
                      os.path.join("..", "templates", "skeleton"), config=True,
                      help="Path where the template skeleton files are located.")

                  # Jinja block delimiters.  An empty string leaves the corresponding
                  # Jinja2 default untouched (see _init_environment).
                  jinja_comment_block_start = Unicode("", config=True)
                  jinja_comment_block_end = Unicode("", config=True)
                  jinja_variable_block_start = Unicode("", config=True)
                  jinja_variable_block_end = Unicode("", config=True)
                  jinja_logic_block_start = Unicode("", config=True)
                  jinja_logic_block_end = Unicode("", config=True)

                  # Extension that the template files use.
                  template_extension = Unicode(".tpl", config=True)

                  # Processors that process the input data prior to the export.  Stays
                  # None until the first call to register_transformer, which replaces
                  # it with a per-instance list.
                  transformers = None

                  def __init__(self, transformers=None, filters=None, config=None, extra_loaders=None, **kw):
                      """
                      Public constructor

                      Parameters
                      ----------
                      transformers : list[of transformer]
                          Custom transformers to apply to the notebook prior to engaging
                          the Jinja template engine.  They are registered after the
                          default transformers.
                      filters : dict[of filter]
                          Filters specified here will override existing filters if a naming
                          conflict occurs.  Filters are available in Jinja templates through
                          the name of the corresponding key.  See the class docstring for
                          the available default filters.
                      config : config
                          User configuration instance.
                      extra_loaders : list[of Jinja Loaders]
                          Ordered list of Jinja loaders used to find templates.  They are
                          tried in order before the default FileSystem ones.
                      """
                      # Call the base class constructor with the default config,
                      # overlaid by the user config when one is given.
                      c = self.default_config
                      if config:
                          c.merge(config)
                      super(Exporter, self).__init__(config=c, **kw)

                      # Standard environment
                      self._init_environment(extra_loaders=extra_loaders)

                      # Add default transformers
                      self._register_transformers()

                      # Add default filters to the Jinja2 environment
                      self._register_filters()

                      # Load user transformers; they run after the default ones.
                      if transformers:
                          for transformer in transformers:
                              self.register_transformer(transformer)

                      # Load user filters.  Overwrite existing filters if need be.
                      if filters is not None:
                          for key, user_filter in filters.items():
                              self.register_filter(key, user_filter)

                  @property
                  def default_config(self):
                      """Return a fresh, empty Config used as the base configuration."""
                      return Config()

                  def from_notebook_node(self, nb, resources=None):
                      """
                      Convert a notebook from a notebook node instance.

                      Parameters
                      ----------
                      nb : Notebook node
                      resources : a dict of additional resources that
                              can be accessed read/write by transformers
                              and filters.

                      Returns
                      -------
                      tuple
                          The rendered template output and the resources produced by
                          preprocessing.
                      """
                      if resources is None:
                          resources = {}
                      nb, resources = self._preprocess(nb, resources)

                      # Load the template file.
                      self.template = self.environment.get_template(self.template_file+self.template_extension)

                      return self.template.render(nb=nb, resources=resources), resources

                  def from_filename(self, filename):
                      """
                      Convert a notebook from a notebook file.

                      Parameters
                      ----------
                      filename : str
                          Full filename of the notebook file to open and convert.
                      """
                      # Notebook files are UTF-8 encoded JSON; do not depend on the
                      # platform's default encoding when reading them.
                      with io.open(filename, encoding='utf-8') as f:
                          return self.from_notebook_node(nbformat.read(f, 'json'))

                  def from_file(self, file_stream):
                      """
                      Convert a notebook from a notebook file.

                      Parameters
                      ----------
                      file_stream : file-like object
                          Notebook file-like object to convert.
                      """
                      return self.from_notebook_node(nbformat.read(file_stream, 'json'))

                  def register_transformer(self, transformer):
                      """
                      Register a transformer.
                      Transformers are classes that act upon the notebook before it is
                      passed into the Jinja templating engine.  Transformers are also
                      capable of passing additional information to the Jinja
                      templating engine.

                      Parameters
                      ----------
                      transformer : transformer
                          A plain function is stored as-is; a HasTraits class is
                          instantiated with this exporter's config; anything else is
                          called with no arguments and the result is stored.

                      Returns
                      -------
                      The object that was appended to ``self.transformers``.
                      """
                      if self.transformers is None:
                          self.transformers = []

                      if inspect.isfunction(transformer):
                          registered = transformer
                      elif isinstance(transformer, MetaHasTraits):
                          registered = transformer(config=self.config)
                      else:
                          registered = transformer()

                      self.transformers.append(registered)
                      return registered

                  def register_filter(self, name, filter):
                      """
                      Register a filter.
                      A filter is a function that accepts and acts on one string.
                      The filters are accessible within the Jinja templating engine.

                      Parameters
                      ----------
                      name : str
                          name to give the filter in the Jinja engine
                      filter : filter
                          A plain function is stored as-is; a HasTraits class is
                          instantiated with this exporter's config; anything else is
                          called with no arguments and the result is stored.

                      Returns
                      -------
                      The object stored in the Jinja environment under ``name``.
                      """
                      if inspect.isfunction(filter):
                          registered = filter
                      elif isinstance(filter, MetaHasTraits):
                          registered = filter(config=self.config)
                      else:
                          registered = filter()

                      self.environment.filters[name] = registered
                      return self.environment.filters[name]

                  def _register_transformers(self):
                      """
                      Register all of the transformers needed for this exporter.
                      """
                      self.register_transformer(transformers.coalesce_streams)

                      # Remember the figure extraction transformer so it can be enabled and
                      # disabled easily later.
                      self.extract_figure_transformer = self.register_transformer(transformers.ExtractFigureTransformer)

                  def _register_filters(self):
                      """
                      Register all of the filters required for the exporter.
                      """
                      for k, v in default_filters.items():
                          self.register_filter(k, v)

                  def _init_environment(self, extra_loaders=None):
                      """
                      Create the Jinja templating environment.

                      Parameters
                      ----------
                      extra_loaders : list[of Jinja Loaders], optional
                          Loaders consulted, in order, before the file system loader
                          built from template_path and template_skeleton_path.
                      """
                      here = os.path.dirname(os.path.realpath(__file__))

                      loaders = []
                      if extra_loaders:
                          loaders.extend(extra_loaders)

                      # Template directories are resolved relative to this module.
                      loaders.append(FileSystemLoader([
                              os.path.join(here, self.template_path),
                              os.path.join(here, self.template_skeleton_path),
                              ]))

                      self.environment = Environment(
                          loader= ChoiceLoader(loaders),
                          extensions=JINJA_EXTENSIONS
                          )

                      # Set special Jinja2 syntax that will not conflict with latex.
                      # Only non-empty traits override the Jinja2 defaults.
                      if self.jinja_logic_block_start:
                          self.environment.block_start_string = self.jinja_logic_block_start
                      if self.jinja_logic_block_end:
                          self.environment.block_end_string = self.jinja_logic_block_end
                      if self.jinja_variable_block_start:
                          self.environment.variable_start_string = self.jinja_variable_block_start
                      if self.jinja_variable_block_end:
                          self.environment.variable_end_string = self.jinja_variable_block_end
                      if self.jinja_comment_block_start:
                          self.environment.comment_start_string = self.jinja_comment_block_start
                      if self.jinja_comment_block_end:
                          self.environment.comment_end_string = self.jinja_comment_block_end

                  def _preprocess(self, nb, resources):
                      """
                      Preprocess the notebook before passing it into the Jinja engine.
                      To preprocess the notebook is to apply all of the registered
                      transformers to it, in registration order.

                      Parameters
                      ----------
                      nb : notebook node
                          notebook that is being exported.
                      resources : a dict of additional resources that
                          can be accessed read/write by transformers
                          and filters.

                      Returns
                      -------
                      tuple
                          The transformed copies of the notebook and resources; the
                          objects passed in are never handed to a transformer.
                      """
                      # Do a deepcopy first,
                      # we are never safe enough with what the transformers could do.
                      nbc = deepcopy(nb)
                      resc = deepcopy(resources)

                      # Run each transformer on the notebook, feeding the output of one
                      # transformer into the next so that results are carried along even
                      # when a transformer returns new objects instead of mutating its
                      # arguments.  `or []` covers the case where nothing was registered.
                      for transformer in self.transformers or []:
                          nbc, resc = transformer(nbc, resc)

                      return nbc, resc

IPython/nbconvert/filters/strings.py

0 +32 -4

+             # coding: utf-8
              """String filters.
              Contains a collection of useful string manipulation filters for use in Jinja
              templates.
              """
              #-----------------------------------------------------------------------------
              # Copyright (c) 2013, the IPython Development Team.
              #
              # Distributed under the terms of the Modified BSD License.
              #
              # The full license is in the file COPYING.txt, distributed with this software.
              #-----------------------------------------------------------------------------
              #-----------------------------------------------------------------------------
              # Imports
              #-----------------------------------------------------------------------------
              import re
              import textwrap
+             from xml.etree import ElementTree
+             from IPython.utils import py3compat
              #-----------------------------------------------------------------------------
              # Functions
              #-----------------------------------------------------------------------------
              __all__ = [
                  'wrap',
+                 'html_text',
+                 'add_anchor',
                  'strip_dollars',
                  'rm_fake',
                  'python_comment',
                  'get_lines'
              ]
              def wrap(text, width=100):
                  """
                  Wrap each line of ``text`` to at most ``width`` characters.

                  The input is split on newlines, every line is wrapped on its own
                  with ``textwrap.wrap`` (which avoids breaking words when possible),
                  and the pieces are joined back together with newlines.

                  Parameters
                  ----------
                  text : str
                      Text to wrap.
                  width : int, optional
                      Number of characters to wrap to, default 100.
                  """
                  rewrapped = []
                  for line in text.split('\n'):
                      # A line that wraps to nothing (e.g. an empty line) contributes
                      # an empty string, so blank lines are kept.
                      pieces = textwrap.wrap(line, width)
                      rewrapped.append('\n'.join(pieces))
                  return '\n'.join(rewrapped)
-             def single_line(text):
-                 """Wrap multi-line text into a single line
+             def html_text(element):
+                 """extract inner text from html
+                 Analog of jQuery's $(element).text()
+                 """
+                 if not isinstance(element, (ElementTree.ElementTree, ElementTree.Element)):
+                     element = ElementTree.fromstring(element)
+                 text = element.text or ""
+                 for child in element:
+                     text += html_text(child)
+                 text += (element.tail or "")
+                 return text
+             def add_anchor(html):
+                 """Add an anchor-link to an html header tag
-                 Used in markdown heading cells, which are not allowed to be multiline.
+                 For use in heading cells
                  """
-                 return ''.join(text.splitlines())
+                 h = ElementTree.fromstring(py3compat.cast_bytes_py2(html))
+                 link = html_text(h).replace(' ', '-')
+                 h.set('id', link)
+                 a = ElementTree.Element("a", {"class" : "anchor-link", "href" : "#" + link})
+                 a.text = u'¶'
+                 h.append(a)
+                 return ElementTree.tostring(h)
              def strip_dollars(text):
                  """
                  Strip leading and trailing dollar symbols from text.

                  Dollar symbols in the interior of the text are left in place.

                  Parameters
                  ----------
                  text : str
                      Text to remove the surrounding dollars from
                  """
                  dollar = '$'
                  return text.strip(dollar)
              # Matches a src/href attribute (optionally quoted) whose value starts
              # with the fake `files/` prefix.
              files_url_pattern = re.compile(r'(src|href)\=([\'"]?)files/')
              def rm_fake(text):
                  """
                  Strip the `files/` prefix from every src/href URL that starts with it.

                  Parameters
                  ----------
                  text : str
                      Text in which to replace 'src="files/real...' with 'src="real...'
                  """
                  def _without_prefix(match):
                      # Rebuild the attribute and its opening quote, minus `files/`.
                      attribute, quote = match.groups()
                      return attribute + "=" + quote

                  return files_url_pattern.sub(_without_prefix, text)
              def python_comment(text):
                  """
                  Turn the input text into Python comment lines.

                  Every line of the input, including the first one, is prefixed
                  with a comment symbol and a space.

                  Parameters
                  ----------
                  text : str
                      Text to comment out.
                  """
                  commented = ['# ' + line for line in text.split('\n')]
                  return '\n'.join(commented)
              def get_lines(text, start=None, end=None):
                  """
                  Return a range of lines from the input text, joined by newlines.

                  The text is split on newlines and sliced like a Python list, so
                  ``start`` is inclusive and ``end`` is exclusive.

                  Parameters
                  ----------
                  text : str
                      Text to parse lines from.
                  start : int, optional
                      Index of the first line to keep.
                  end : int, optional
                      Index at which to stop (that line is not included).
                  """
                  wanted = slice(start, end)
                  return "\n".join(text.split("\n")[wanted])

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages