##// END OF EJS Templates
Added exporter tests
Added exporter tests

File last commit:

r11476:6a905927 merge
r11480:87b152ef
Show More
exporter.py
441 lines | 15.6 KiB | text/x-python | PythonLexer
"""This module defines Exporter, a highly configurable converter
that uses Jinja2 to export notebook files into different formats.
"""
#-----------------------------------------------------------------------------
# Copyright (c) 2013, the IPython Development Team.
#
# Distributed under the terms of the Modified BSD License.
#
# The full license is in the file COPYING.txt, distributed with this software.
#-----------------------------------------------------------------------------
#-----------------------------------------------------------------------------
# Imports
#-----------------------------------------------------------------------------
from __future__ import print_function, absolute_import
# Stdlib imports
import io
import os
import inspect
import types
import copy
import collections
import datetime
# other libs/dependencies
from jinja2 import Environment, FileSystemLoader, ChoiceLoader
# IPython imports
from IPython.config.configurable import Configurable
from IPython.config import Config
from IPython.nbformat import current as nbformat
from IPython.utils.traitlets import MetaHasTraits, DottedObjectName, Unicode, List, Dict
from IPython.utils.importstring import import_item
from IPython.utils.text import indent
from IPython.nbconvert import transformers as nbtransformers
from IPython.nbconvert import filters
#-----------------------------------------------------------------------------
# Globals and constants
#-----------------------------------------------------------------------------
# Jinja2 extensions enabled on every Exporter environment.
JINJA_EXTENSIONS = ['jinja2.ext.loopcontrols']

# Filters registered on every Exporter's Jinja2 environment, keyed by the
# name under which templates reference them.  User-supplied filters are
# registered afterwards and may therefore override any of these names.
# NOTE: 'highlight' and 'highlight2html' intentionally share one callable.
default_filters = {
    'indent': indent,
    'markdown': filters.markdown2html,
    'ansi2html': filters.ansi2html,
    'filter_data_type': filters.DataTypeFilter,
    'get_lines': filters.get_lines,
    'highlight': filters.highlight,
    'highlight2html': filters.highlight,
    'highlight2latex': filters.highlight2latex,
    'markdown2latex': filters.markdown2latex,
    'markdown2rst': filters.markdown2rst,
    'pycomment': filters.python_comment,
    'rm_ansi': filters.remove_ansi,
    'rm_dollars': filters.strip_dollars,
    'rm_fake': filters.rm_fake,
    'html_text': filters.html_text,
    'add_anchor': filters.add_anchor,
    'ansi2latex': filters.ansi2latex,
    'rm_math_space': filters.rm_math_space,
    'wrap': filters.wrap,
}
#-----------------------------------------------------------------------------
# Class
#-----------------------------------------------------------------------------
class ResourcesDict(collections.defaultdict):
    """Dictionary whose missing keys read as the empty string.

    Looking up an absent key yields ``''`` and does NOT insert the key, so
    ``key in d`` stays False after a failed lookup.  Because this derives
    from ``defaultdict``, the first positional constructor argument is the
    ``default_factory`` (callable or None), not initial contents; populate
    an instance with ``update()`` or keyword arguments instead.
    """

    def __missing__(self, key):
        """Return the empty-string placeholder for any absent *key*."""
        return ''
class Exporter(Configurable):
    """
    Exports notebooks into other file formats. Uses Jinja 2 templating engine
    to output new formats. Inherit from this class if you are creating a new
    template type along with new filters/transformers. If the filters/
    transformers provided by default suffice, there is no need to inherit from
    this class. Instead, override the template_file and file_extension
    traits via a config file.

    {filters}
    """

    # Finish the docstring by listing the default filter names.  Guarded
    # because docstrings are stripped (``__doc__`` is None) under ``-OO``;
    # names are sorted so the generated text is deterministic.
    if __doc__ is not None:
        __doc__ = __doc__.format(
            filters='- ' + '\n    - '.join(sorted(default_filters)))

    template_file = Unicode(
        '', config=True,
        help="Name of the template file to use")

    file_extension = Unicode(
        'txt', config=True,
        help="Extension of the file that should be written to disk"
        )

    template_path = Unicode(
        os.path.join("..", "templates"), config=True,
        help="Path where the template files are located.")

    template_skeleton_path = Unicode(
        os.path.join("..", "templates", "skeleton"), config=True,
        help="Path where the template skeleton files are located.")

    # Jinja block definitions.  An empty string means "keep Jinja's default".
    jinja_comment_block_start = Unicode("", config=True)
    jinja_comment_block_end = Unicode("", config=True)
    jinja_variable_block_start = Unicode("", config=True)
    jinja_variable_block_end = Unicode("", config=True)
    jinja_logic_block_start = Unicode("", config=True)
    jinja_logic_block_end = Unicode("", config=True)

    # Extension that the template files use.
    template_extension = Unicode(".tpl", config=True)

    # Configurability, allows the user to easily add filters and transformers.
    transformers = List(config=True,
        help="""List of transformers, by name or namespace, to enable.""")

    filters = Dict(config=True,
        help="""Dictionary of filters, by name and namespace, to add to the Jinja
        environment.""")

    default_transformers = List([nbtransformers.coalesce_streams,
                                 nbtransformers.SVG2PDFTransformer,
                                 nbtransformers.ExtractFigureTransformer,
                                 nbtransformers.CSSHTMLHeaderTransformer,
                                 nbtransformers.RevealHelpTransformer,
                                 nbtransformers.LatexTransformer,
                                 nbtransformers.SphinxTransformer],
        config=True,
        help="""List of transformers available by default, by name, namespace,
        instance, or type.""")

    def __init__(self, config=None, extra_loaders=None, **kw):
        """
        Public constructor

        Parameters
        ----------
        config : config
            User configuration instance.  Merged on top of
            ``default_config`` when truthy.
        extra_loaders : list[of Jinja Loaders]
            Ordered list of Jinja loaders used to find templates.  They are
            tried in order before the default FileSystem ones.
        """
        # Call the base class constructor with defaults + user overrides.
        c = self.default_config
        if config:
            c.merge(config)

        super(Exporter, self).__init__(config=c, **kw)

        # Init.  Filters are registered on the environment, so the
        # environment has to exist before _init_filters runs.
        self._init_environment(extra_loaders=extra_loaders)
        self._init_transformers()
        self._init_filters()

    @property
    def default_config(self):
        """Fresh, empty ``Config`` used as the base that user config is merged into."""
        return Config()

    def from_notebook_node(self, nb, resources=None, **kw):
        """
        Convert a notebook from a notebook node instance.

        Parameters
        ----------
        nb : Notebook node
        resources : dict (**kw)
            of additional resources that can be accessed read/write by
            transformers and filters.

        Returns
        -------
        (output, resources) : the rendered template output and the resources
            as returned by the transformers.
        """
        # Work on a copy so the caller's notebook is never modified.
        nb_copy = copy.deepcopy(nb)
        resources = self._init_resources(resources)

        # Preprocess
        nb_copy, resources = self._transform(nb_copy, resources)

        # Convert
        self.template = self.environment.get_template(self.template_file + self.template_extension)
        output = self.template.render(nb=nb_copy, resources=resources)
        return output, resources

    def from_filename(self, filename, resources=None, **kw):
        """
        Convert a notebook from a notebook file.

        Populates ``resources['metadata']`` with the notebook ``name`` (file
        name without its extension) and ``modified_date`` (file mtime,
        formatted like "March 5, 2013") before converting.

        Parameters
        ----------
        filename : str
            Full filename of the notebook file to open and convert.
        """
        # Pull the metadata from the filesystem.
        if resources is None:
            resources = ResourcesDict()
        if not 'metadata' in resources or resources['metadata'] == '':
            resources['metadata'] = ResourcesDict()

        basename = os.path.basename(filename)
        # rfind() returns -1 when there is no dot; slicing with -1 would
        # silently drop the last character of an extension-less name.
        dot = basename.rfind('.')
        notebook_name = basename[:dot] if dot != -1 else basename
        resources['metadata']['name'] = notebook_name

        modified_date = datetime.datetime.fromtimestamp(os.path.getmtime(filename))
        # "%-d" (day without zero padding) is a glibc extension that is not
        # portable, so the day number is formatted separately.
        resources['metadata']['modified_date'] = "{0} {1}, {2}".format(
            modified_date.strftime("%B"),
            modified_date.day,
            modified_date.strftime("%Y"))

        # Notebook files are UTF-8 encoded JSON; do not depend on the locale.
        with io.open(filename, encoding='utf-8') as f:
            return self.from_notebook_node(nbformat.read(f, 'json'), resources=resources, **kw)

    def from_file(self, file_stream, resources=None, **kw):
        """
        Convert a notebook from an open notebook file stream.

        Parameters
        ----------
        file_stream : file-like object
            Notebook file-like object to convert.
        """
        return self.from_notebook_node(nbformat.read(file_stream, 'json'), resources=resources, **kw)

    def register_transformer(self, transformer, enabled=False):
        """
        Register a transformer.

        Transformers are classes that act upon the notebook before it is
        passed into the Jinja templating engine.  Transformers are also
        capable of passing additional information to the Jinja
        templating engine.

        Parameters
        ----------
        transformer : transformer
            A dotted import name, a class, or an already constructed
            callable.
        enabled : bool
            When true, ``transformer.enabled`` is set to True on the
            registered callable.

        Returns
        -------
        The callable that was appended to the transformer list.

        Raises
        ------
        TypeError
            If *transformer* is None or is an instance that is not callable.
        """
        if transformer is None:
            raise TypeError('transformer')
        isclass = inspect.isclass(transformer)
        constructed = not isclass

        # ``types.StringTypes`` only exists on Python 2; fall back to ``str``.
        string_types = getattr(types, 'StringTypes', str)

        # Handle transformer's registration based on its type
        if constructed and isinstance(transformer, string_types):
            # Transformer is a string, import the namespace and recursively
            # call this register_transformer method
            transformer_cls = import_item(transformer)
            return self.register_transformer(transformer_cls, enabled)

        if constructed and hasattr(transformer, '__call__'):
            # Transformer is a function, no need to construct it.
            # Register and return the transformer.
            if enabled:
                transformer.enabled = True
            self._transformers.append(transformer)
            return transformer

        elif isclass and isinstance(transformer, MetaHasTraits):
            # Transformer is configurable.  Construct it with this exporter
            # as parent; the enabled flag is applied by the recursive call.
            return self.register_transformer(transformer(parent=self), enabled)

        elif isclass:
            # Transformer is not configurable, construct it
            return self.register_transformer(transformer(), enabled)

        else:
            # Transformer is an instance of something without a __call__
            # attribute.
            raise TypeError('transformer')

    def register_filter(self, name, filter):
        """
        Register a filter.

        A filter is a function that accepts and acts on one string.
        The filters are accessible within the Jinja templating engine.

        Parameters
        ----------
        name : str
            name to give the filter in the Jinja engine
        filter : filter
            A dotted import name, a class, or an already constructed
            callable.

        Returns
        -------
        The callable that was stored in the Jinja environment.

        Raises
        ------
        TypeError
            If *filter* is None or is an instance that is not callable.
        """
        if filter is None:
            raise TypeError('filter')
        isclass = inspect.isclass(filter)
        constructed = not isclass

        # ``types.StringTypes`` only exists on Python 2; fall back to ``str``.
        string_types = getattr(types, 'StringTypes', str)

        # Handle filter's registration based on its type
        if constructed and isinstance(filter, string_types):
            # filter is a string, import the namespace and recursively call
            # this register_filter method
            filter_cls = import_item(filter)
            return self.register_filter(name, filter_cls)

        if constructed and hasattr(filter, '__call__'):
            # filter is a function, no need to construct it.
            self.environment.filters[name] = filter
            return filter

        elif isclass and isinstance(filter, MetaHasTraits):
            # filter is configurable, construct it with this exporter as
            # parent.
            return self.register_filter(name, filter(parent=self))

        elif isclass:
            # filter is not configurable, construct it
            return self.register_filter(name, filter())

        else:
            # filter is an instance of something without a __call__
            # attribute.
            raise TypeError('filter')

    def _init_environment(self, extra_loaders=None):
        """
        Create the Jinja templating environment.

        Templates are looked up first in *extra_loaders* (if any), then in
        ``template_path`` and ``template_skeleton_path``, both resolved
        relative to the directory containing this module.
        """
        here = os.path.dirname(os.path.realpath(__file__))
        loaders = []
        if extra_loaders:
            loaders.extend(extra_loaders)

        loaders.append(FileSystemLoader([
            os.path.join(here, self.template_path),
            os.path.join(here, self.template_skeleton_path),
            ]))

        self.environment = Environment(
            loader=ChoiceLoader(loaders),
            extensions=JINJA_EXTENSIONS
            )

        # Set special Jinja2 syntax that will not conflict with latex.
        # Empty traits leave the corresponding Jinja default untouched.
        if self.jinja_logic_block_start:
            self.environment.block_start_string = self.jinja_logic_block_start
        if self.jinja_logic_block_end:
            self.environment.block_end_string = self.jinja_logic_block_end
        if self.jinja_variable_block_start:
            self.environment.variable_start_string = self.jinja_variable_block_start
        if self.jinja_variable_block_end:
            self.environment.variable_end_string = self.jinja_variable_block_end
        if self.jinja_comment_block_start:
            self.environment.comment_start_string = self.jinja_comment_block_start
        if self.jinja_comment_block_end:
            self.environment.comment_end_string = self.jinja_comment_block_end

    def _init_transformers(self):
        """
        Register all of the transformers needed for this exporter, disabled
        unless specified explicitly.
        """
        self._transformers = []

        # Load default transformers (not necessarily enabled by default).
        if self.default_transformers:
            for transformer in self.default_transformers:
                self.register_transformer(transformer)

        # Load user transformers.  Enable by default.
        if self.transformers:
            for transformer in self.transformers:
                self.register_transformer(transformer, enabled=True)

    def _init_filters(self):
        """
        Register all of the filters required for the exporter.
        """
        # Add default filters to the Jinja2 environment
        for key, value in default_filters.items():
            self.register_filter(key, value)

        # Load user filters.  Overwrite existing filters if need be.
        if self.filters:
            for key, user_filter in self.filters.items():
                self.register_filter(key, user_filter)

    def _init_resources(self, resources):
        """
        Normalise *resources* into the structure the templates rely on.

        Guarantees that the result is a ``ResourcesDict`` whose 'metadata'
        entry is itself a ``ResourcesDict`` with a non-empty 'name'
        (defaulting to 'Notebook'), and that 'output_extension' is set to
        this exporter's ``file_extension``.  A ``ResourcesDict`` passed in
        is updated in place; any other mapping is copied first.
        """
        # Make sure the resources dict is of ResourcesDict type.
        if resources is None:
            resources = ResourcesDict()
        if not isinstance(resources, ResourcesDict):
            new_resources = ResourcesDict()
            new_resources.update(resources)
            resources = new_resources

        # Make sure the metadata extension exists in resources
        if 'metadata' in resources:
            if not isinstance(resources['metadata'], ResourcesDict):
                # ResourcesDict is a defaultdict: its first positional
                # argument is the default factory, so passing the mapping
                # to the constructor raises TypeError.  Copy via update().
                new_metadata = ResourcesDict()
                new_metadata.update(resources['metadata'])
                resources['metadata'] = new_metadata
        else:
            resources['metadata'] = ResourcesDict()
        if not resources['metadata']['name']:
            resources['metadata']['name'] = 'Notebook'

        # Set the output extension
        resources['output_extension'] = self.file_extension
        return resources

    def _transform(self, nb, resources):
        """
        Preprocess the notebook before passing it into the Jinja engine.

        To preprocess the notebook is to call every registered transformer
        on it, in registration order, feeding each one the notebook and
        resources returned by the previous one.

        Parameters
        ----------
        nb : notebook node
            notebook that is being exported.
        resources : a dict of additional resources that
            can be accessed read/write by transformers
            and filters.

        Returns
        -------
        (nb, resources) : the transformed copies.
        """
        # Do a copy.deepcopy first,
        # we are never safe enough with what the transformers could do.
        nbc = copy.deepcopy(nb)
        resc = copy.deepcopy(resources)

        # Run each transformer on the notebook.  Carry the output along
        # to each transformer
        for transformer in self._transformers:
            nbc, resc = transformer(nbc, resc)
        return nbc, resc