upstream/ipython Commit - r13921:93f09d85

Extract output preprocessor only extracts specified formats

Thomas Kluyver -

r13921:93f09d85

parent child

IPython/html/nbconvert/tests/test_nbconvert_handlers.py

0 +6 0

             # coding: utf-8
+            import base64
             import io
             import json
             import os
             from os.path import join as pjoin
             import shutil
             import requests
             from IPython.html.utils import url_path_join
             from IPython.html.tests.launchnotebook import NotebookTestBase, assert_http_error
             from IPython.nbformat.current import (new_notebook, write, new_worksheet,
                                                   new_heading_cell, new_code_cell,
                                                   new_output)
             class NbconvertAPI(object):
                 """Small HTTP client for the nbconvert endpoints.

                 Every call is sent to ``<base_url>/nbconvert/<path>``.
                 """

                 def __init__(self, base_url):
                     # Root URL that all request paths are joined onto.
                     self.base_url = base_url

                 def _req(self, verb, path, body=None, params=None):
                     """Issue one request and hand back the response object.

                     ``raise_for_status()`` is called on the response before it is
                     returned, so error statuses surface as exceptions.
                     """
                     target = url_path_join(self.base_url, 'nbconvert', path)
                     reply = requests.request(verb, target, data=body, params=params)
                     reply.raise_for_status()
                     return reply

                 def from_file(self, format, path, name, download=False):
                     """GET ``<format>/<path>/<name>``, passing ``download`` as a query parameter."""
                     resource = url_path_join(format, path, name)
                     query = {'download': download}
                     return self._req('GET', resource, params=query)

                 def from_post(self, format, nbmodel):
                     """POST ``nbmodel`` serialized as JSON to ``<format>``."""
                     payload = json.dumps(nbmodel)
                     return self._req('POST', format, payload)

                 def list_formats(self):
                     """GET the nbconvert root path (empty sub-path)."""
                     return self._req('GET', '')
+            png_green_pixel = base64.encodestring(b'\x89PNG\r\n\x1a\n\x00\x00\x00\rIHDR\x00'
+            b'\x00\x00\x01\x00\x00x00\x01\x08\x02\x00\x00\x00\x90wS\xde\x00\x00\x00\x0cIDAT'
+            b'\x08\xd7c\x90\xfb\xcf\x00\x00\x02\\\x01\x1e.~d\x87\x00\x00\x00\x00IEND\xaeB`\x82')
             class APITest(NotebookTestBase):
                 """Tests for the nbconvert HTTP handlers, driven through NbconvertAPI."""
                 def setUp(self):
                     # Fixture: <notebook_dir>/foo/testnb.ipynb containing one heading cell
                     # and one code cell with a text output and a PNG output.
                     nbdir = self.notebook_dir.name
                     if not os.path.isdir(pjoin(nbdir, 'foo')):
                         os.mkdir(pjoin(nbdir, 'foo'))
                     nb = new_notebook(name='testnb')
                     ws = new_worksheet()
                     nb.worksheets = [ws]
                     # Non-ASCII character in the heading; the file is written as UTF-8 below.
                     ws.cells.append(new_heading_cell(u'Created by test ³'))
                     cc1 = new_code_cell(input=u'print(2*6)')
                     cc1.outputs.append(new_output(output_text=u'12'))
+                    cc1.outputs.append(new_output(output_png=png_green_pixel, output_type='pyout'))
                     ws.cells.append(cc1)
                     with io.open(pjoin(nbdir, 'foo', 'testnb.ipynb'), 'w',
                                  encoding='utf-8') as f:
                         write(nb, f, format='ipynb')
                     self.nbconvert_api = NbconvertAPI(self.base_url())
                 def tearDown(self):
                     # Remove the fixture directory; errors (e.g. already gone) are ignored.
                     nbdir = self.notebook_dir.name
                     for dname in ['foo']:
                         shutil.rmtree(pjoin(nbdir, dname), ignore_errors=True)
                 def test_from_file(self):
                     # Convert the stored notebook to HTML, then to a Python script.
                     r = self.nbconvert_api.from_file('html', 'foo', 'testnb.ipynb')
                     self.assertEqual(r.status_code, 200)
                     self.assertIn(u'text/html', r.headers['Content-Type'])
                     self.assertIn(u'Created by test', r.text)
                     self.assertIn(u'print', r.text)
                     r = self.nbconvert_api.from_file('python', 'foo', 'testnb.ipynb')
                     self.assertIn(u'text/x-python', r.headers['Content-Type'])
                     self.assertIn(u'print(2*6)', r.text)
                 def test_from_file_404(self):
                     # A notebook name that was never written must produce HTTP 404.
                     with assert_http_error(404):
                         self.nbconvert_api.from_file('html', 'foo', 'thisdoesntexist.ipynb')
                 def test_from_file_download(self):
                     # download=True should yield an attachment named after the notebook.
                     r = self.nbconvert_api.from_file('python', 'foo', 'testnb.ipynb', download=True)
                     content_disposition = r.headers['Content-Disposition']
                     self.assertIn('attachment', content_disposition)
                     self.assertIn('testnb.py', content_disposition)
                 def test_from_file_zip(self):
                     # The latex download is expected to come back as a zip archive.
                     r = self.nbconvert_api.from_file('latex', 'foo', 'testnb.ipynb', download=True)
                     self.assertIn(u'application/zip', r.headers['Content-Type'])
                     self.assertIn(u'.zip', r.headers['Content-Disposition'])
                 def test_from_post(self):
                     # Fetch the notebook model as JSON, then POST it back for conversion.
                     nbmodel_url = url_path_join(self.base_url(), 'api/notebooks/foo/testnb.ipynb')
                     nbmodel = requests.get(nbmodel_url).json()
                     r = self.nbconvert_api.from_post(format='html', nbmodel=nbmodel)
                     self.assertEqual(r.status_code, 200)
                     self.assertIn(u'text/html', r.headers['Content-Type'])
                     self.assertIn(u'Created by test', r.text)
                     self.assertIn(u'print', r.text)
                     r = self.nbconvert_api.from_post(format='python', nbmodel=nbmodel)
                     self.assertIn(u'text/x-python', r.headers['Content-Type'])
                     self.assertIn(u'print(2*6)', r.text)
                 def test_from_post_zip(self):
                     # Same as test_from_file_zip, but the notebook is supplied in the POST body.
                     nbmodel_url = url_path_join(self.base_url(), 'api/notebooks/foo/testnb.ipynb')
                     nbmodel = requests.get(nbmodel_url).json()
                     r = self.nbconvert_api.from_post(format='latex', nbmodel=nbmodel)
                     self.assertIn(u'application/zip', r.headers['Content-Type'])
                     self.assertIn(u'.zip', r.headers['Content-Disposition'])

IPython/nbconvert/preprocessors/extractoutput.py

0 +4 -3

             """Module containing a preprocessor that extracts all of the outputs from the
             notebook file.  The extracted outputs are returned in the 'resources' dictionary.
             """
             #-----------------------------------------------------------------------------
             # Copyright (c) 2013, the IPython Development Team.
             #
             # Distributed under the terms of the Modified BSD License.
             #
             # The full license is in the file COPYING.txt, distributed with this software.
             #-----------------------------------------------------------------------------
             #-----------------------------------------------------------------------------
             # Imports
             #-----------------------------------------------------------------------------
             import base64
             import sys
             import os
-            from IPython.utils.traitlets import Unicode
+            from IPython.utils.traitlets import Unicode, Set
             from .base import Preprocessor
             from IPython.utils import py3compat
             #-----------------------------------------------------------------------------
             # Classes
             #-----------------------------------------------------------------------------
             class ExtractOutputPreprocessor(Preprocessor):
                 """
                 Extracts cell outputs of the configured types from the notebook.

                 For every output that carries one of the types in
                 `extract_output_types`, the payload is stored in
                 resources['outputs'] under a generated filename, and that filename
                 is recorded on the output itself as '<type>_filename'.
                 """
                 # Template for generated filenames; formatted with unique_key,
                 # cell_index, index and extension.
                 output_filename_template = Unicode(
                     "{unique_key}_{cell_index}_{index}.{extension}", config=True)
                 # Output types that are pulled out into resources['outputs'].
                 # NOTE(review): 'jpeg' is handled as a binary type in preprocess_cell
                 # but is not in this default set -- confirm which key notebook
                 # outputs actually use for JPEG data.
+                extract_output_types = Set({'png', 'jpg', 'svg', 'pdf'}, config=True)
                 def preprocess_cell(self, cell, resources, cell_index):
                     """
                     Extract the configured output types from a single cell.

                     Parameters
                     ----------
                     cell : NotebookNode cell
                         Notebook cell being processed
                     resources : dictionary
                         Additional resources used in the conversion process.  Allows
                         preprocessors to pass variables into the Jinja engine.
                     cell_index : int
                         Index of the cell being processed (see base.py)

                     Returns
                     -------
                     (cell, resources) : the same objects that were passed in, with
                         '<type>_filename' entries added to the cell's outputs and the
                         extracted data added to resources['outputs'].
                     """
                     #Get the unique key from the resource dict if it exists.  If it does not
                     #exist, use 'output' as the default.  Also, get files directory if it
                     #has been specified
                     unique_key = resources.get('unique_key', 'output')
                     output_files_dir = resources.get('output_files_dir', None)
                     #Make sure resources['outputs'] is a dict before filling it.
                     #NOTE(review): the subscript raises KeyError on a plain dict without
                     #an 'outputs' key; presumably `resources` supplies a default for
                     #missing keys -- confirm against the caller.
                     if not isinstance(resources['outputs'], dict):
                         resources['outputs'] = {}
                     #Loop through all of the outputs in the cell
                     for index, out in enumerate(cell.get('outputs', [])):
-                        #Get the output in data formats that the template is interested in.
+                        #Get the output in data formats that the template needs extracted
-                        for out_type in self.display_data_priority:
+                        for out_type in self.extract_output_types:
                             if out.hasattr(out_type):
                                 data = out[out_type]
                                 #Binary files are base64-encoded, SVG is already XML
                                 if out_type in ('png', 'jpg', 'jpeg', 'pdf'):
                                     # data is b64-encoded as text (str, unicode)
                                     # decodestring only accepts bytes
                                     data = py3compat.cast_bytes(data)
                                     data = base64.decodestring(data)
                                 elif sys.platform == 'win32':
                                     #Text output on Windows: convert newlines to CRLF
                                     #before encoding to bytes.
                                     data = data.replace('\n', '\r\n').encode("UTF-8")
                                 else:
                                     data = data.encode("UTF-8")
                                 #Build an output name
                                 filename = self.output_filename_template.format(
                                                 unique_key=unique_key,
                                                 cell_index=cell_index,
                                                 index=index,
                                                 extension=out_type)
                                 #On the cell, make the figure available via
                                 #   cell.outputs[i].svg_filename  ... etc (svg in example)
                                 # Where
                                 #   cell.outputs[i].svg  contains the data
                                 if output_files_dir is not None:
                                     filename = os.path.join(output_files_dir, filename)
                                 out[out_type + '_filename'] = filename
                                 #In the resources, make the figure available via
                                 #   resources['outputs']['filename'] = data
                                 resources['outputs'][filename] = data
                     return cell, resources

IPython/nbconvert/templates/python.tpl

0 +2 -2

             {%- extends 'null.tpl' -%}
             {% block in_prompt %}
             # In[{{ cell.prompt_number if cell.prompt_number else ' ' }}]:
             {% endblock in_prompt %}
             {% block output_prompt %}
             # Out[{{ cell.prompt_number }}]:
             {% endblock output_prompt %}
             {% block input %}
             {{ cell.input | ipython2python }}
             {% endblock input %}
             {# These two blocks handle error display.
             Even though the first one seems to do nothing,
             it introduces a new line.
             #}
             {% block pyerr %}
             {{ super() }}
             {% endblock pyerr %}
             {% block traceback_line %}
             {{ line | indent | strip_ansi }}
             {% endblock traceback_line %}
             {# .... #}
             {% block pyout %}
-            {{ output.text | indent | comment_lines }}
+            {{ (output.text or '') | indent | comment_lines }}{# parentheses required: filters bind tighter than `or` #}
             {% endblock pyout %}
             {% block stream %}
             {{ output.text | indent | comment_lines }}
             {% endblock stream %}
             {% block display_data scoped %}
             # image file:
             {% endblock display_data %}
             {% block markdowncell scoped %}
             {{ cell.source | comment_lines }}
             {% endblock markdowncell %}
             {% block headingcell scoped %}
             {{ '#' * cell.level }}{{ cell.source | replace('\n', ' ') | comment_lines }}
             {% endblock headingcell %}
             {% block unknowncell scoped %}
             unknown type  {{ cell.type }}
-            {% endblock unknowncell %}
  No newline at end of file
+            {% endblock unknowncell %}

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages