nbconvert.py
706 lines
| 21.7 KiB
| text/x-python
|
PythonLexer
Fernando Perez
|
r6220 | #!/usr/bin/env python | ||
Paul Ivanov
|
r6280 | """Convert IPython notebooks to other formats, such as ReST, and HTML. | ||
Fernando Perez
|
r6220 | |||
Paul Ivanov
|
r6280 | Example: | ||
./nbconvert.py --format html file.ipynb | ||||
Fernando Perez
|
r6220 | |||
Produces 'file.rst' and 'file.html', along with auto-generated figure files | ||||
Paul Ivanov
|
r6280 | called nb_figure_NN.png. To avoid the two-step process, ipynb -> rst -> html, | ||
use '--format quick-html' which will do ipynb -> html, but won't look as | ||||
pretty. | ||||
Fernando Perez
|
r6220 | """ | ||
Fernando Perez
|
r6677 | #----------------------------------------------------------------------------- | ||
# Imports | ||||
#----------------------------------------------------------------------------- | ||||
Fernando Perez
|
r6671 | from __future__ import print_function | ||
Fernando Perez
|
r6220 | |||
Fernando Perez
|
r6677 | # Stdlib | ||
Fernando Perez
|
r6672 | import codecs | ||
Fernando Perez
|
r6674 | import logging | ||
Fernando Perez
|
r6220 | import os | ||
Fernando Perez
|
r6671 | import pprint | ||
import re | ||||
Fernando Perez
|
r6220 | import subprocess | ||
import sys | ||||
Fernando Perez
|
r6671 | |||
Fernando Perez
|
r6677 | # From IPython | ||
Paul Ivanov
|
r6262 | from IPython.external import argparse | ||
Fernando Perez
|
r6220 | from IPython.nbformat import current as nbformat | ||
Paul Ivanov
|
r6257 | from IPython.utils.text import indent | ||
Anton I. Sipos
|
r6266 | from decorators import DocInherit | ||
Fernando Perez
|
r6220 | |||
Fernando Perez
|
r6677 | #----------------------------------------------------------------------------- | ||
# Utility functions | ||||
#----------------------------------------------------------------------------- | ||||
def remove_fake_files_url(cell): | ||||
"""Remove from the cell source the /files/ pseudo-path we use. | ||||
""" | ||||
src = cell.source | ||||
cell.source = src.replace('/files/', '') | ||||
Fernando Perez
|
r6671 | def remove_ansi(src): | ||
"""Strip all ANSI color escape sequences from input string. | ||||
Parameters | ||||
---------- | ||||
src : string | ||||
Returns | ||||
------- | ||||
string | ||||
""" | ||||
return re.sub(r'\033\[(0|\d;\d\d)m', '', src) | ||||
Fernando Perez
|
r6677 | |||
Fernando Perez
|
r6671 | # Pandoc-dependent code | ||
def markdown2latex(src): | ||||
"""Convert a markdown string to LaTeX via pandoc. | ||||
Fernando Perez
|
r6220 | |||
Fernando Perez
|
r6671 | This function will raise an error if pandoc is not installed. | ||
Any error messages generated by pandoc are printed to stderr. | ||||
Parameters | ||||
---------- | ||||
src : string | ||||
Input string, assumed to be valid markdown. | ||||
Returns | ||||
------- | ||||
out : string | ||||
Output as returned by pandoc. | ||||
Fernando Perez
|
r6220 | """ | ||
Fernando Perez
|
r6671 | p = subprocess.Popen('pandoc -f markdown -t latex'.split(), | ||
stdin=subprocess.PIPE, stdout=subprocess.PIPE) | ||||
out, err = p.communicate(src) | ||||
if err: | ||||
print(err, file=sys.stderr) | ||||
#print('*'*20+'\n', out, '\n'+'*'*20) # dbg | ||||
return out | ||||
Fernando Perez
|
r6220 | |||
Fernando Perez
|
r6222 | def rst_directive(directive, text=''): | ||
out = [directive, ''] | ||||
if text: | ||||
out.extend([indent(text), '']) | ||||
return out | ||||
Fernando Perez
|
r6220 | |||
Fernando Perez
|
r6677 | #----------------------------------------------------------------------------- | ||
# Class declarations | ||||
#----------------------------------------------------------------------------- | ||||
Anton I. Sipos
|
r6261 | |||
Paul Ivanov
|
r6239 | class ConversionException(Exception): | ||
pass | ||||
Anton I. Sipos
|
r6253 | |||
Paul Ivanov
|
r6239 | class Converter(object): | ||
default_encoding = 'utf-8' | ||||
Fernando Perez
|
r6672 | extension = str() | ||
Fernando Perez
|
r6671 | figures_counter = 0 | ||
Fernando Perez
|
r6672 | infile = str() | ||
infile_dir = str() | ||||
infile_root = str() | ||||
files_dir = str() | ||||
Fernando Perez
|
r6673 | with_preamble = True | ||
user_preamble = None | ||||
output = str() | ||||
Fernando Perez
|
r6674 | raw_as_verbatim = False | ||
Fernando Perez
|
r6673 | |||
Anton I. Sipos
|
r6261 | def __init__(self, infile): | ||
self.infile = infile | ||||
Fernando Perez
|
r6672 | self.infile_dir = os.path.dirname(infile) | ||
infile_root = os.path.splitext(infile)[0] | ||||
files_dir = infile_root + '_files' | ||||
if not os.path.isdir(files_dir): | ||||
os.mkdir(files_dir) | ||||
self.infile_root = infile_root | ||||
self.files_dir = files_dir | ||||
Paul Ivanov
|
r6239 | |||
Anton I. Sipos
|
r6253 | def dispatch(self, cell_type): | ||
Paul Ivanov
|
r6239 | """return cell_type dependent render method, for example render_code | ||
""" | ||||
Fernando Perez
|
r6671 | return getattr(self, 'render_' + cell_type, self.render_unknown) | ||
Paul Ivanov
|
r6239 | |||
def convert(self): | ||||
lines = [] | ||||
Paul Ivanov
|
r6267 | lines.extend(self.optional_header()) | ||
Fernando Perez
|
r6671 | for worksheet in self.nb.worksheets: | ||
for cell in worksheet.cells: | ||||
Fernando Perez
|
r6674 | #print(cell.cell_type) # dbg | ||
Fernando Perez
|
r6671 | conv_fn = self.dispatch(cell.cell_type) | ||
Fernando Perez
|
r6677 | if cell.cell_type in ('markdown', 'raw'): | ||
remove_fake_files_url(cell) | ||||
Fernando Perez
|
r6671 | lines.extend(conv_fn(cell)) | ||
lines.append('') | ||||
Paul Ivanov
|
r6267 | lines.extend(self.optional_footer()) | ||
Paul Ivanov
|
r6239 | return '\n'.join(lines) | ||
def render(self): | ||||
Anton I. Sipos
|
r6261 | "read, convert, and save self.infile" | ||
Paul Ivanov
|
r6239 | self.read() | ||
self.output = self.convert() | ||||
return self.save() | ||||
def read(self): | ||||
"read and parse notebook into NotebookNode called self.nb" | ||||
Anton I. Sipos
|
r6261 | with open(self.infile) as f: | ||
Paul Ivanov
|
r6239 | self.nb = nbformat.read(f, 'json') | ||
Anton I. Sipos
|
r6261 | def save(self, infile=None, encoding=None): | ||
Paul Ivanov
|
r6239 | "read and parse notebook into self.nb" | ||
Anton I. Sipos
|
r6261 | if infile is None: | ||
Stefan van der Walt
|
r6680 | outfile = os.path.basename(self.infile) | ||
outfile = os.path.splitext(outfile)[0] + '.' + self.extension | ||||
Paul Ivanov
|
r6239 | if encoding is None: | ||
encoding = self.default_encoding | ||||
Stefan van der Walt
|
r6680 | with open(outfile, 'w') as f: | ||
Paul Ivanov
|
r6239 | f.write(self.output.encode(encoding)) | ||
Stefan van der Walt
|
r6680 | return os.path.abspath(outfile) | ||
Fernando Perez
|
r6220 | |||
Paul Ivanov
|
r6279 | def optional_header(self): | ||
return [] | ||||
Paul Ivanov
|
r6267 | |||
Paul Ivanov
|
r6279 | def optional_footer(self): | ||
return [] | ||||
Paul Ivanov
|
r6267 | |||
Fernando Perez
|
r6672 | def _new_figure(self, data, fmt): | ||
"""Create a new figure file in the given format. | ||||
Returns a path relative to the input file. | ||||
""" | ||||
figname = '%s_fig_%02i.%s' % (self.infile_root, | ||||
self.figures_counter, fmt) | ||||
Fernando Perez
|
r6671 | self.figures_counter += 1 | ||
Fernando Perez
|
r6672 | fullname = os.path.join(self.files_dir, figname) | ||
# Binary files are base64-encoded, SVG is already XML | ||||
if fmt in ('png', 'jpg', 'pdf'): | ||||
data = data.decode('base64') | ||||
fopen = lambda fname: open(fname, 'wb') | ||||
else: | ||||
fopen = lambda fname: codecs.open(fname, 'wb', self.default_encoding) | ||||
with fopen(fullname) as f: | ||||
f.write(data) | ||||
return fullname | ||||
Fernando Perez
|
r6671 | |||
Anton I. Sipos
|
r6253 | def render_heading(self, cell): | ||
Anton I. Sipos
|
r6266 | """convert a heading cell | ||
Returns list.""" | ||||
Anton I. Sipos
|
r6253 | raise NotImplementedError | ||
def render_code(self, cell): | ||||
Anton I. Sipos
|
r6266 | """Convert a code cell | ||
Returns list.""" | ||||
Anton I. Sipos
|
r6253 | raise NotImplementedError | ||
Paul Ivanov
|
r6249 | |||
Anton I. Sipos
|
r6253 | def render_markdown(self, cell): | ||
Anton I. Sipos
|
r6266 | """convert a markdown cell | ||
Returns list.""" | ||||
Anton I. Sipos
|
r6253 | raise NotImplementedError | ||
Paul Ivanov
|
r6249 | |||
Fernando Perez
|
r6671 | def render_pyout(self, output): | ||
Anton I. Sipos
|
r6266 | """convert pyout part of a code cell | ||
Returns list.""" | ||||
Anton I. Sipos
|
r6253 | raise NotImplementedError | ||
Paul Ivanov
|
r6249 | |||
Fernando Perez
|
r6671 | |||
def render_pyerr(self, output): | ||||
"""convert pyerr part of a code cell | ||||
Returns list.""" | ||||
raise NotImplementedError | ||||
Fernando Perez
|
r6672 | def _img_lines(self, img_file): | ||
"""Return list of lines to include an image file.""" | ||||
# Note: subclasses may choose to implement format-specific _FMT_lines | ||||
# methods if they so choose (FMT in {png, svg, jpg, pdf}). | ||||
raise NotImplementedError | ||||
Fernando Perez
|
r6671 | def render_display_data(self, output): | ||
Anton I. Sipos
|
r6266 | """convert display data from the output of a code cell | ||
Returns list. | ||||
""" | ||||
Fernando Perez
|
r6672 | lines = [] | ||
for fmt in ['png', 'svg', 'jpg', 'pdf']: | ||||
if fmt in output: | ||||
img_file = self._new_figure(output[fmt], fmt) | ||||
# Subclasses can have format-specific render functions (e.g., | ||||
# latex has to auto-convert all SVG to PDF first). | ||||
lines_fun = getattr(self, '_%s_lines' % fmt, None) | ||||
if not lines_fun: | ||||
lines_fun = self._img_lines | ||||
lines.extend(lines_fun(img_file)) | ||||
return lines | ||||
Paul Ivanov
|
r6249 | |||
Anton I. Sipos
|
r6253 | def render_stream(self, cell): | ||
Anton I. Sipos
|
r6266 | """convert stream part of a code cell | ||
Returns list.""" | ||||
raise NotImplementedError | ||||
Fernando Perez
|
r6674 | def render_raw(self, cell): | ||
"""convert a cell with raw text | ||||
Anton I. Sipos
|
r6266 | |||
Returns list.""" | ||||
Anton I. Sipos
|
r6253 | raise NotImplementedError | ||
Fernando Perez
|
r6220 | |||
Fernando Perez
|
r6671 | def render_unknown(self, cell): | ||
"""Render cells of unkown type | ||||
Returns list.""" | ||||
Fernando Perez
|
r6674 | data = pprint.pformat(cell) | ||
logging.warning('Unknown cell:\n%s' % data) | ||||
return self._unknown_lines(data) | ||||
def _unknown_lines(self, data): | ||||
"""Return list of lines for an unknown cell. | ||||
Parameters | ||||
---------- | ||||
data : str | ||||
The content of the unknown data as a single string. | ||||
""" | ||||
Fernando Perez
|
r6671 | raise NotImplementedError | ||
Paul Ivanov
|
r6249 | |||
Paul Ivanov
|
r6239 | class ConverterRST(Converter): | ||
extension = 'rst' | ||||
Paul Ivanov
|
r6264 | heading_level = {1: '=', 2: '-', 3: '`', 4: '\'', 5: '.', 6: '~'} | ||
Anton I. Sipos
|
r6253 | |||
Anton I. Sipos
|
r6266 | @DocInherit | ||
Anton I. Sipos
|
r6253 | def render_heading(self, cell): | ||
Paul Ivanov
|
r6264 | marker = self.heading_level[cell.level] | ||
Anton I. Sipos
|
r6253 | return ['{0}\n{1}\n'.format(cell.source, marker * len(cell.source))] | ||
Fernando Perez
|
r6220 | |||
Anton I. Sipos
|
r6266 | @DocInherit | ||
Anton I. Sipos
|
r6253 | def render_code(self, cell): | ||
Paul Ivanov
|
r6239 | if not cell.input: | ||
return [] | ||||
Fernando Perez
|
r6220 | |||
Paul Ivanov
|
r6239 | lines = ['In[%s]:' % cell.prompt_number, ''] | ||
lines.extend(rst_directive('.. code:: python', cell.input)) | ||||
Fernando Perez
|
r6220 | |||
Paul Ivanov
|
r6239 | for output in cell.outputs: | ||
conv_fn = self.dispatch(output.output_type) | ||||
lines.extend(conv_fn(output)) | ||||
Anton I. Sipos
|
r6266 | |||
Paul Ivanov
|
r6239 | return lines | ||
Fernando Perez
|
r6220 | |||
Anton I. Sipos
|
r6266 | @DocInherit | ||
Anton I. Sipos
|
r6253 | def render_markdown(self, cell): | ||
Paul Ivanov
|
r6239 | return [cell.source] | ||
Fernando Perez
|
r6220 | |||
Anton I. Sipos
|
r6266 | @DocInherit | ||
Fernando Perez
|
r6674 | def render_raw(self, cell): | ||
if self.raw_as_verbatim: | ||||
return ['::', '', indent(cell.source), ''] | ||||
else: | ||||
return [cell.source] | ||||
Anton I. Sipos
|
r6256 | |||
Anton I. Sipos
|
r6266 | @DocInherit | ||
Anton I. Sipos
|
r6253 | def render_pyout(self, output): | ||
Paul Ivanov
|
r6239 | lines = ['Out[%s]:' % output.prompt_number, ''] | ||
Paul Ivanov
|
r6249 | |||
Anton I. Sipos
|
r6252 | # output is a dictionary like object with type as a key | ||
Paul Ivanov
|
r6239 | if 'latex' in output: | ||
lines.extend(rst_directive('.. math::', output.latex)) | ||||
Fernando Perez
|
r6220 | |||
Paul Ivanov
|
r6239 | if 'text' in output: | ||
lines.extend(rst_directive('.. parsed-literal::', output.text)) | ||||
Fernando Perez
|
r6220 | |||
Paul Ivanov
|
r6239 | return lines | ||
Fernando Perez
|
r6220 | |||
Anton I. Sipos
|
r6266 | @DocInherit | ||
Fernando Perez
|
r6674 | def render_pyerr(self, output): | ||
# Note: a traceback is a *list* of frames. | ||||
return ['::', '', indent(remove_ansi('\n'.join(output.traceback))), ''] | ||||
@DocInherit | ||||
Fernando Perez
|
r6672 | def _img_lines(self, img_file): | ||
Fernando Perez
|
r6673 | return ['.. image:: %s' % img_file, ''] | ||
Fernando Perez
|
r6672 | |||
Anton I. Sipos
|
r6266 | @DocInherit | ||
Anton I. Sipos
|
r6253 | def render_stream(self, output): | ||
Paul Ivanov
|
r6249 | lines = [] | ||
if 'text' in output: | ||||
lines.extend(rst_directive('.. parsed-literal::', output.text)) | ||||
Paul Ivanov
|
r6239 | return lines | ||
Fernando Perez
|
r6220 | |||
Fernando Perez
|
r6671 | @DocInherit | ||
Fernando Perez
|
r6674 | def _unknown_lines(self, data): | ||
return rst_directive('.. warning:: Unknown cell') + [data] | ||||
Fernando Perez
|
r6671 | |||
Fernando Perez
|
r6673 | |||
Paul Ivanov
|
r6267 | class ConverterQuickHTML(Converter): | ||
extension = 'html' | ||||
Fernando Perez
|
r6674 | def in_tag(self, tag, src): | ||
"""Return a list of elements bracketed by the given tag""" | ||||
return ['<%s>' % tag, src, '</%s>' % tag] | ||||
Paul Ivanov
|
r6267 | def optional_header(self): | ||
# XXX: inject the IPython standard CSS into here | ||||
s = """<html> | ||||
<head> | ||||
</head> | ||||
<body> | ||||
""" | ||||
return s.splitlines() | ||||
def optional_footer(self): | ||||
s = """</body> | ||||
</html> | ||||
""" | ||||
return s.splitlines() | ||||
@DocInherit | ||||
def render_heading(self, cell): | ||||
marker = cell.level | ||||
return ['<h{1}>\n {0}\n</h{1}>'.format(cell.source, marker)] | ||||
@DocInherit | ||||
def render_code(self, cell): | ||||
if not cell.input: | ||||
return [] | ||||
lines = ['<table>'] | ||||
lines.append('<tr><td><tt>In [<b>%s</b>]:</tt></td><td><tt>' % cell.prompt_number) | ||||
lines.append("<br>\n".join(cell.input.splitlines())) | ||||
lines.append('</tt></td></tr>') | ||||
for output in cell.outputs: | ||||
lines.append('<tr><td></td><td>') | ||||
conv_fn = self.dispatch(output.output_type) | ||||
lines.extend(conv_fn(output)) | ||||
lines.append('</td></tr>') | ||||
lines.append('</table>') | ||||
return lines | ||||
@DocInherit | ||||
def render_markdown(self, cell): | ||||
Fernando Perez
|
r6674 | return self.in_tag('pre', cell.source) | ||
Paul Ivanov
|
r6267 | |||
@DocInherit | ||||
Fernando Perez
|
r6674 | def render_raw(self, cell): | ||
if self.raw_as_verbatim: | ||||
return self.in_tag('pre', cell.source) | ||||
else: | ||||
return [cell.source] | ||||
Paul Ivanov
|
r6267 | |||
@DocInherit | ||||
def render_pyout(self, output): | ||||
Fernando Perez
|
r6674 | lines = ['<tr><td><tt>Out[<b>%s</b>]:</tt></td></tr>' % | ||
output.prompt_number, '<td>'] | ||||
Paul Ivanov
|
r6267 | |||
# output is a dictionary like object with type as a key | ||||
Fernando Perez
|
r6674 | for out_type in ('text', 'latex'): | ||
if out_type in output: | ||||
lines.extend(self.in_tag('pre', indent(output[out_type]))) | ||||
Paul Ivanov
|
r6267 | |||
return lines | ||||
@DocInherit | ||||
Fernando Perez
|
r6674 | def render_pyerr(self, output): | ||
# Note: a traceback is a *list* of frames. | ||||
return self.in_tag('pre', remove_ansi('\n'.join(output.traceback))) | ||||
@DocInherit | ||||
Fernando Perez
|
r6672 | def _img_lines(self, img_file): | ||
return ['<img src="%s">' % img_file, ''] | ||||
Paul Ivanov
|
r6267 | |||
@DocInherit | ||||
def render_stream(self, output): | ||||
lines = [] | ||||
if 'text' in output: | ||||
lines.append(output.text) | ||||
return lines | ||||
Anton I. Sipos
|
r6253 | |||
Fernando Perez
|
r6674 | @DocInherit | ||
def _unknown_lines(self, data): | ||||
return ['<h2>Warning:: Unknown cell</h2>'] + self.in_tag('pre', data) | ||||
Fernando Perez
|
r6671 | |||
class ConverterLaTeX(Converter): | ||||
Fernando Perez
|
r6672 | """Converts a notebook to a .tex file suitable for pdflatex. | ||
Note: this converter *needs*: | ||||
- `pandoc`: for all conversion of markdown cells. If your notebook only | ||||
has Raw cells, pandoc will not be needed. | ||||
- `inkscape`: if your notebook has SVG figures. These need to be | ||||
converted to PDF before inclusion in the TeX file, as LaTeX doesn't | ||||
understand SVG natively. | ||||
You will in general obtain much better final PDF results if you configure | ||||
the matplotlib backend to create SVG output with | ||||
%config InlineBackend.figure_format = 'svg' | ||||
(or set the equivalent flag at startup or in your configuration profile). | ||||
""" | ||||
Fernando Perez
|
r6671 | extension = 'tex' | ||
Fernando Perez
|
r6673 | documentclass = 'article' | ||
documentclass_options = '11pt,english' | ||||
heading_map = {1: r'\section', | ||||
2: r'\subsection', | ||||
3: r'\subsubsection', | ||||
4: r'\paragraph', | ||||
5: r'\subparagraph', | ||||
6: r'\subparagraph'} | ||||
Fernando Perez
|
r6671 | |||
Fernando Perez
|
r6674 | def in_env(self, environment, lines): | ||
Fernando Perez
|
r6671 | """Return list of environment lines for input lines | ||
Parameters | ||||
---------- | ||||
env : string | ||||
Name of the environment to bracket with begin/end. | ||||
lines: """ | ||||
out = [r'\begin{%s}' % environment] | ||||
if isinstance(lines, basestring): | ||||
out.append(lines) | ||||
else: # list | ||||
out.extend(lines) | ||||
out.append(r'\end{%s}' % environment) | ||||
return out | ||||
Fernando Perez
|
r6673 | |||
def convert(self): | ||||
# The main body is done by the logic in the parent class, and that's | ||||
# all we need if preamble support has been turned off. | ||||
body = super(ConverterLaTeX, self).convert() | ||||
if not self.with_preamble: | ||||
return body | ||||
# But if preamble is on, then we need to construct a proper, standalone | ||||
# tex file. | ||||
# Tag the document at the top and set latex class | ||||
final = [ r'%% This file was auto-generated by IPython, do NOT edit', | ||||
r'%% Conversion from the original notebook file:', | ||||
r'%% {0}'.format(self.infile), | ||||
r'%%', | ||||
r'\documentclass[%s]{%s}' % (self.documentclass_options, | ||||
self.documentclass), | ||||
'', | ||||
] | ||||
# Load our own preamble, which is stored next to the main file. We | ||||
# need to be careful in case the script entry point is a symlink | ||||
myfile = __file__ if not os.path.islink(__file__) else \ | ||||
os.readlink(__file__) | ||||
with open(os.path.join(os.path.dirname(myfile), 'preamble.tex')) as f: | ||||
final.append(f.read()) | ||||
# Load any additional user-supplied preamble | ||||
if self.user_preamble: | ||||
final.extend(['', '%% Adding user preamble from file:', | ||||
'%% {0}'.format(self.user_preamble), '']) | ||||
with open(self.user_preamble) as f: | ||||
final.append(f.read()) | ||||
# Include document body | ||||
final.extend([ r'\begin{document}', '', | ||||
body, | ||||
r'\end{document}', '']) | ||||
# Retun value must be a string | ||||
return '\n'.join(final) | ||||
Fernando Perez
|
r6671 | @DocInherit | ||
def render_heading(self, cell): | ||||
Fernando Perez
|
r6673 | marker = self.heading_map[cell.level] | ||
Fernando Perez
|
r6675 | return ['%s{%s}' % (marker, cell.source) ] | ||
Fernando Perez
|
r6671 | |||
@DocInherit | ||||
def render_code(self, cell): | ||||
if not cell.input: | ||||
return [] | ||||
# Cell codes first carry input code, we use lstlisting for that | ||||
lines = [r'\begin{codecell}'] | ||||
Fernando Perez
|
r6674 | lines.extend(self.in_env('codeinput', | ||
self.in_env('lstlisting', cell.input))) | ||||
Fernando Perez
|
r6671 | |||
outlines = [] | ||||
for output in cell.outputs: | ||||
conv_fn = self.dispatch(output.output_type) | ||||
outlines.extend(conv_fn(output)) | ||||
# And then output of many possible types; use a frame for all of it. | ||||
if outlines: | ||||
Fernando Perez
|
r6674 | lines.extend(self.in_env('codeoutput', outlines)) | ||
Fernando Perez
|
r6671 | |||
lines.append(r'\end{codecell}') | ||||
return lines | ||||
Fernando Perez
|
r6672 | @DocInherit | ||
def _img_lines(self, img_file): | ||||
Fernando Perez
|
r6674 | return self.in_env('center', | ||
Fernando Perez
|
r6672 | [r'\includegraphics[width=3in]{%s}' % img_file, r'\par']) | ||
def _svg_lines(self, img_file): | ||||
base_file = os.path.splitext(img_file)[0] | ||||
pdf_file = base_file + '.pdf' | ||||
subprocess.check_call(['inkscape', '--export-pdf=%s' % pdf_file, | ||||
img_file]) | ||||
return self._img_lines(pdf_file) | ||||
Fernando Perez
|
r6671 | |||
@DocInherit | ||||
def render_stream(self, output): | ||||
lines = [] | ||||
if 'text' in output: | ||||
Fernando Perez
|
r6674 | lines.extend(self.in_env('verbatim', output.text.strip())) | ||
Fernando Perez
|
r6671 | |||
return lines | ||||
@DocInherit | ||||
def render_markdown(self, cell): | ||||
Fernando Perez
|
r6677 | return [markdown2latex(cell.source)] | ||
Fernando Perez
|
r6671 | |||
@DocInherit | ||||
def render_pyout(self, output): | ||||
lines = [] | ||||
# output is a dictionary like object with type as a key | ||||
if 'latex' in output: | ||||
lines.extend(output.latex) | ||||
if 'text' in output: | ||||
Fernando Perez
|
r6674 | lines.extend(self.in_env('verbatim', output.text)) | ||
Fernando Perez
|
r6671 | |||
return lines | ||||
@DocInherit | ||||
def render_pyerr(self, output): | ||||
# Note: a traceback is a *list* of frames. | ||||
Fernando Perez
|
r6674 | return self.in_env('traceback', | ||
self.in_env('verbatim', | ||||
Fernando Perez
|
r6671 | remove_ansi('\n'.join(output.traceback)))) | ||
@DocInherit | ||||
Fernando Perez
|
r6674 | def render_raw(self, cell): | ||
if self.raw_as_verbatim: | ||||
return self.in_env('verbatim', cell.source) | ||||
else: | ||||
return [cell.source] | ||||
@DocInherit | ||||
def _unknown_lines(self, data): | ||||
return [r'{\vspace{5mm}\bf WARNING:: unknown cell:}'] + \ | ||||
self.in_env('verbatim', data) | ||||
Fernando Perez
|
r6671 | |||
Fernando Perez
|
r6677 | #----------------------------------------------------------------------------- | ||
# Standalone conversion functions | ||||
#----------------------------------------------------------------------------- | ||||
Fernando Perez
|
r6671 | |||
Anton I. Sipos
|
r6261 | def rst2simplehtml(infile): | ||
Fernando Perez
|
r6220 | """Convert a rst file to simplified html suitable for blogger. | ||
This just runs rst2html with certain parameters to produce really simple | ||||
html and strips the document header, so the resulting file can be easily | ||||
pasted into a blogger edit window. | ||||
""" | ||||
# This is the template for the rst2html call that produces the cleanest, | ||||
# simplest html I could find. This should help in making it easier to | ||||
# paste into the blogspot html window, though I'm still having problems | ||||
# with linebreaks there... | ||||
smithj1
|
r6229 | cmd_template = ("rst2html --link-stylesheet --no-xml-declaration " | ||
Fernando Perez
|
r6220 | "--no-generator --no-datestamp --no-source-link " | ||
"--no-toc-backlinks --no-section-numbering " | ||||
"--strip-comments ") | ||||
Anton I. Sipos
|
r6261 | cmd = "%s %s" % (cmd_template, infile) | ||
Fernando Perez
|
r6220 | proc = subprocess.Popen(cmd, | ||
stdout=subprocess.PIPE, | ||||
stderr=subprocess.PIPE, | ||||
shell=True) | ||||
html, stderr = proc.communicate() | ||||
if stderr: | ||||
raise IOError(stderr) | ||||
# Make an iterator so breaking out holds state. Our implementation of | ||||
# searching for the html body below is basically a trivial little state | ||||
# machine, so we need this. | ||||
walker = iter(html.splitlines()) | ||||
# Find start of main text, break out to then print until we find end /div. | ||||
# This may only work if there's a real title defined so we get a 'div class' | ||||
# tag, I haven't really tried. | ||||
for line in walker: | ||||
smithj1
|
r6228 | if line.startswith('<body>'): | ||
Fernando Perez
|
r6220 | break | ||
Anton I. Sipos
|
r6261 | newfname = os.path.splitext(infile)[0] + '.html' | ||
Fernando Perez
|
r6220 | with open(newfname, 'w') as f: | ||
for line in walker: | ||||
smithj1
|
r6228 | if line.startswith('</body>'): | ||
Fernando Perez
|
r6220 | break | ||
f.write(line) | ||||
f.write('\n') | ||||
Anton I. Sipos
|
r6253 | |||
Fernando Perez
|
r6220 | return newfname | ||
Fernando Perez
|
r6671 | known_formats = "rst (default), html, quick-html, latex" | ||
Fernando Perez
|
r6220 | |||
Anton I. Sipos
|
r6261 | def main(infile, format='rst'): | ||
Fernando Perez
|
r6220 | """Convert a notebook to html in one step""" | ||
Paul Ivanov
|
r6280 | # XXX: this is just quick and dirty for now. When adding a new format, | ||
# make sure to add it to the `known_formats` string above, which gets | ||||
# printed in in the catch-all else, as well as in the help | ||||
Anton I. Sipos
|
r6261 | if format == 'rst': | ||
converter = ConverterRST(infile) | ||||
converter.render() | ||||
elif format == 'html': | ||||
#Currently, conversion to html is a 2 step process, nb->rst->html | ||||
converter = ConverterRST(infile) | ||||
rstfname = converter.render() | ||||
rst2simplehtml(rstfname) | ||||
Paul Ivanov
|
r6267 | elif format == 'quick-html': | ||
converter = ConverterQuickHTML(infile) | ||||
rstfname = converter.render() | ||||
Fernando Perez
|
r6671 | elif format == 'latex': | ||
converter = ConverterLaTeX(infile) | ||||
latexfname = converter.render() | ||||
Paul Ivanov
|
r6280 | else: | ||
raise SystemExit("Unknown format '%s', " % format + | ||||
"known formats are: " + known_formats) | ||||
Fernando Perez
|
r6220 | |||
Fernando Perez
|
r6677 | #----------------------------------------------------------------------------- | ||
# Script main | ||||
#----------------------------------------------------------------------------- | ||||
Anton I. Sipos
|
r6261 | |||
Paul Ivanov
|
r6280 | if __name__ == '__main__': | ||
parser = argparse.ArgumentParser(description=__doc__, | ||||
formatter_class=argparse.RawTextHelpFormatter) | ||||
Anton I. Sipos
|
r6261 | # TODO: consider passing file like object around, rather than filenames | ||
# would allow us to process stdin, or even http streams | ||||
#parser.add_argument('infile', nargs='?', type=argparse.FileType('r'), default=sys.stdin) | ||||
#Require a filename as a positional argument | ||||
parser.add_argument('infile', nargs=1) | ||||
Anton I. Sipos
|
r6265 | parser.add_argument('-f', '--format', default='rst', | ||
Paul Ivanov
|
r6280 | help='Output format. Supported formats: \n' + | ||
known_formats) | ||||
Anton I. Sipos
|
r6261 | args = parser.parse_args() | ||
main(infile=args.infile[0], format=args.format) | ||||