Show More
@@ -1,120 +1,162 b'' | |||||
1 | """Module containing a preprocessor that removes the outputs from code cells""" |
|
1 | """Module containing a preprocessor that removes the outputs from code cells""" | |
2 |
|
2 | |||
3 | # Copyright (c) IPython Development Team. |
|
3 | # Copyright (c) IPython Development Team. | |
4 | # Distributed under the terms of the Modified BSD License. |
|
4 | # Distributed under the terms of the Modified BSD License. | |
5 |
|
5 | |||
6 | #----------------------------------------------------------------------------- |
|
|||
7 | # Imports |
|
|||
8 | #----------------------------------------------------------------------------- |
|
|||
9 |
|
||||
10 | import os |
|
6 | import os | |
11 | import sys |
|
7 | import sys | |
12 |
|
8 | |||
13 | try: |
|
9 | try: | |
14 | from queue import Empty # Py 3 |
|
10 | from queue import Empty # Py 3 | |
15 | except ImportError: |
|
11 | except ImportError: | |
16 | from Queue import Empty # Py 2 |
|
12 | from Queue import Empty # Py 2 | |
17 |
|
13 | |||
18 | from IPython.kernel import KernelManager |
|
14 | from IPython.utils.traitlets import List, Unicode | |
19 | from IPython.nbformat.current import reads, NotebookNode, writes |
|
|||
20 |
|
15 | |||
|
16 | from IPython.nbformat.current import reads, NotebookNode, writes | |||
21 | from .base import Preprocessor |
|
17 | from .base import Preprocessor | |
22 |
|
18 | |||
|
19 | # default timeout for reply and output: 10s | |||
|
20 | TIMEOUT = 10 | |||
23 |
|
21 | |||
24 | #----------------------------------------------------------------------------- |
|
|||
25 | # Classes |
|
|||
26 | #----------------------------------------------------------------------------- |
|
|||
27 | class ExecutePreprocessor(Preprocessor): |
|
22 | class ExecutePreprocessor(Preprocessor): | |
28 | """ |
|
23 | """ | |
29 | Executes all the cells in a notebook |
|
24 | Executes all the cells in a notebook | |
30 | """ |
|
25 | """ | |
31 | def __init__(self, extra_arguments=[], **kwargs): |
|
26 | ||
32 | """ |
|
27 | # FIXME: to be removed with nbformat v4 | |
33 | Start an kernel to run the Python code |
|
28 | # map msg_type to v3 output_type | |
34 | """ |
|
29 | msg_type_map = { | |
35 | super(ExecutePreprocessor, self).__init__(**kwargs) |
|
30 | "error" : "pyerr", | |
36 | self.extra_arguments = [] |
|
31 | "execute_result" : "pyout", | |
|
32 | } | |||
|
33 | ||||
|
34 | # FIXME: to be removed with nbformat v4 | |||
|
35 | # map mime-type to v3 mime-type keys | |||
|
36 | mime_map = { | |||
|
37 | "text/plain" : "text", | |||
|
38 | "text/html" : "html", | |||
|
39 | "image/svg+xml" : "svg", | |||
|
40 | "image/png" : "png", | |||
|
41 | "image/jpeg" : "jpeg", | |||
|
42 | "text/latex" : "latex", | |||
|
43 | "application/json" : "json", | |||
|
44 | "application/javascript" : "javascript", | |||
|
45 | } | |||
|
46 | ||||
|
47 | extra_arguments = List(Unicode) | |||
37 |
|
48 | |||
38 | def _create_client(self): |
|
49 | def _create_client(self): | |
|
50 | from IPython.kernel import KernelManager | |||
39 | self.km = KernelManager() |
|
51 | self.km = KernelManager() | |
40 | self.km.start_kernel(extra_arguments=self.extra_arguments, stderr=open(os.devnull, 'w')) |
|
52 | self.km.start_kernel(extra_arguments=self.extra_arguments, stderr=open(os.devnull, 'w')) | |
41 | self.kc = self.km.client() |
|
53 | self.kc = self.km.client() | |
42 | self.kc.start_channels() |
|
54 | self.kc.start_channels() | |
|
55 | self.log.debug('kc.start_channels: %s', self.kc.session.session) | |||
43 | self.iopub = self.kc.iopub_channel |
|
56 | self.iopub = self.kc.iopub_channel | |
44 | self.shell = self.kc.shell_channel |
|
57 | self.shell = self.kc.shell_channel | |
45 | self.shell.kernel_info() |
|
58 | self.shell.kernel_info() | |
|
59 | try: | |||
|
60 | self.shell.get_msg(timeout=TIMEOUT) | |||
|
61 | except Empty: | |||
|
62 | self.log.error("Timeout waiting for kernel_info reply") | |||
|
63 | raise | |||
|
64 | try: | |||
|
65 | self.iopub.get_msg(timeout=TIMEOUT) | |||
|
66 | except Empty: | |||
|
67 | self.log.warn("Timeout waiting for IOPub on startup") | |||
46 |
|
68 | |||
47 | def _shutdown_client(self): |
|
69 | def _shutdown_client(self): | |
48 | self.kc.stop_channels() |
|
70 | self.kc.stop_channels() | |
49 | self.km.shutdown_kernel() |
|
71 | self.km.shutdown_kernel() | |
50 | del self.km |
|
72 | del self.km | |
51 |
|
73 | |||
52 | def preprocess(self, nb, resources): |
|
74 | def preprocess(self, nb, resources): | |
53 | self._create_client() |
|
75 | self._create_client() | |
54 | nb, resources = super(ExecutePreprocessor, self).preprocess(nb, resources) |
|
76 | nb, resources = super(ExecutePreprocessor, self).preprocess(nb, resources) | |
55 | self._shutdown_client() |
|
77 | self._shutdown_client() | |
56 | return nb, resources |
|
78 | return nb, resources | |
57 |
|
79 | |||
58 | def preprocess_cell(self, cell, resources, cell_index): |
|
80 | def preprocess_cell(self, cell, resources, cell_index): | |
59 | """ |
|
81 | """ | |
60 | Apply a transformation on each code cell. See base.py for details. |
|
82 | Apply a transformation on each code cell. See base.py for details. | |
61 | """ |
|
83 | """ | |
62 | if cell.cell_type != 'code': |
|
84 | if cell.cell_type != 'code': | |
63 | return cell, resources |
|
85 | return cell, resources | |
64 | try: |
|
86 | try: | |
65 | outputs = self.run_cell(self.shell, self.iopub, cell) |
|
87 | outputs = self.run_cell(self.shell, self.iopub, cell) | |
66 | except Exception as e: |
|
88 | except Exception as e: | |
67 | self.log.error("failed to run cell: " + repr(e)) |
|
89 | self.log.error("failed to run cell: " + repr(e)) | |
68 | self.log.error(str(cell.input)) |
|
90 | self.log.error(str(cell.input)) | |
69 |
|
|
91 | raise | |
70 | cell.outputs = outputs |
|
92 | cell.outputs = outputs | |
71 | return cell, resources |
|
93 | return cell, resources | |
72 |
|
94 | |||
73 | @staticmethod |
|
95 | def run_cell(self, shell, iopub, cell): | |
74 | def run_cell(shell, iopub, cell): |
|
96 | msg_id = shell.execute(cell.input) | |
75 | # print cell.input |
|
97 | self.log.debug("Executing cell:\n%s", cell.input) | |
76 | shell.execute(cell.input) |
|
98 | # wait for finish, with timeout | |
77 | # wait for finish, maximum 20s |
|
99 | while True: | |
78 | shell.get_msg(timeout=20) |
|
100 | try: | |
|
101 | msg = shell.get_msg(timeout=TIMEOUT) | |||
|
102 | except Empty: | |||
|
103 | self.log.error("Timeout waiting for execute reply") | |||
|
104 | raise | |||
|
105 | if msg['parent_header'].get('msg_id') == msg_id: | |||
|
106 | break | |||
|
107 | else: | |||
|
108 | # not our reply | |||
|
109 | continue | |||
|
110 | ||||
79 | outs = [] |
|
111 | outs = [] | |
80 |
|
112 | |||
81 | while True: |
|
113 | while True: | |
82 | try: |
|
114 | try: | |
83 |
msg = iopub.get_msg(timeout= |
|
115 | msg = iopub.get_msg(timeout=TIMEOUT) | |
84 | except Empty: |
|
116 | except Empty: | |
|
117 | self.log.warn("Timeout waiting for IOPub output") | |||
85 | break |
|
118 | break | |
|
119 | if msg['parent_header'].get('msg_id') != msg_id: | |||
|
120 | # not an output from our execution | |||
|
121 | continue | |||
86 |
|
122 | |||
87 | msg_type = msg['msg_type'] |
|
123 | msg_type = msg['msg_type'] | |
|
124 | self.log.debug("output: %s", msg_type) | |||
88 | content = msg['content'] |
|
125 | content = msg['content'] | |
89 | out = NotebookNode(output_type=msg_type) |
|
126 | if msg_type == 'status': | |
|
127 | if content['execution_state'] == 'idle': | |||
|
128 | break | |||
|
129 | else: | |||
|
130 | continue | |||
|
131 | elif msg_type in {'execute_input', 'pyin'}: | |||
|
132 | continue | |||
|
133 | elif msg_type == 'clear_output': | |||
|
134 | outs = [] | |||
|
135 | continue | |||
|
136 | ||||
|
137 | out = NotebookNode(output_type=self.msg_type_map.get(msg_type, msg_type)) | |||
90 |
|
138 | |||
91 | # set the prompt number for the input and the output |
|
139 | # set the prompt number for the input and the output | |
92 | if 'execution_count' in content: |
|
140 | if 'execution_count' in content: | |
93 | cell['prompt_number'] = content['execution_count'] |
|
141 | cell['prompt_number'] = content['execution_count'] | |
94 | out.prompt_number = content['execution_count'] |
|
142 | out.prompt_number = content['execution_count'] | |
95 |
|
143 | |||
96 | if msg_type in ('status', 'pyin'): |
|
|||
97 | continue |
|
|||
98 | elif msg_type == 'clear_output': |
|
|||
99 | outs = [] |
|
|||
100 | continue |
|
|||
101 |
|
||||
102 | if msg_type == 'stream': |
|
144 | if msg_type == 'stream': | |
103 | out.stream = content['name'] |
|
145 | out.stream = content['name'] | |
104 | out.text = content['data'] |
|
146 | out.text = content['data'] | |
105 |
elif msg_type in ('display_data', ' |
|
147 | elif msg_type in ('display_data', 'execute_result'): | |
106 | out['metadata'] = content['metadata'] |
|
148 | out['metadata'] = content['metadata'] | |
107 |
for mime, data in content['data']. |
|
149 | for mime, data in content['data'].items(): | |
108 | attr = mime.split('/')[-1].lower() |
|
150 | # map mime-type keys to nbformat v3 keys | |
109 | # this gets most right, but fix svg+html, plain |
|
151 | # this will be unnecessary in nbformat v4 | |
110 | attr = attr.replace('+xml', '').replace('plain', 'text') |
|
152 | key = self.mime_map.get(mime, mime) | |
111 |
|
|
153 | out[key] = data | |
112 |
elif msg_type == ' |
|
154 | elif msg_type == 'error': | |
113 | out.ename = content['ename'] |
|
155 | out.ename = content['ename'] | |
114 | out.evalue = content['evalue'] |
|
156 | out.evalue = content['evalue'] | |
115 | out.traceback = content['traceback'] |
|
157 | out.traceback = content['traceback'] | |
116 | else: |
|
158 | else: | |
117 | self.log.error("unhandled iopub msg: " + msg_type) |
|
159 | self.log.error("unhandled iopub msg: " + msg_type) | |
118 |
|
160 | |||
119 | outs.append(out) |
|
161 | outs.append(out) | |
120 | return outs |
|
162 | return outs |
@@ -1,87 +1,86 b'' | |||||
1 | """ |
|
1 | """ | |
2 | Module with tests for the execute preprocessor. |
|
2 | Module with tests for the execute preprocessor. | |
3 | """ |
|
3 | """ | |
4 |
|
4 | |||
5 | # Copyright (c) IPython Development Team. |
|
5 | # Copyright (c) IPython Development Team. | |
6 | # Distributed under the terms of the Modified BSD License. |
|
6 | # Distributed under the terms of the Modified BSD License. | |
7 |
|
7 | |||
8 | import copy |
|
8 | import copy | |
9 | import os |
|
9 | import os | |
10 | import re |
|
10 | import re | |
11 |
|
11 | |||
12 | from IPython.nbformat import current as nbformat |
|
12 | from IPython.nbformat import current as nbformat | |
13 |
|
13 | |||
14 | from .base import PreprocessorTestsBase |
|
14 | from .base import PreprocessorTestsBase | |
15 | from ..execute import ExecutePreprocessor |
|
15 | from ..execute import ExecutePreprocessor | |
16 |
|
16 | |||
17 | from IPython.nbconvert.filters import strip_ansi |
|
17 | from IPython.nbconvert.filters import strip_ansi | |
18 |
|
18 | |||
19 |
|
19 | |||
20 | addr_pat = re.compile(r'0x[0-9a-f]{7,9}') |
|
20 | addr_pat = re.compile(r'0x[0-9a-f]{7,9}') | |
21 |
|
21 | |||
22 |
|
||||
23 | class TestExecute(PreprocessorTestsBase): |
|
22 | class TestExecute(PreprocessorTestsBase): | |
24 | """Contains test functions for execute.py""" |
|
23 | """Contains test functions for execute.py""" | |
25 |
|
24 | |||
26 | @staticmethod |
|
25 | @staticmethod | |
27 |
def normalize_ |
|
26 | def normalize_output(output): | |
28 | """ |
|
27 | """ | |
29 |
Normalizes |
|
28 | Normalizes outputs for comparison. | |
30 | """ |
|
29 | """ | |
31 |
|
|
30 | output = dict(output) | |
32 |
if 'metadata' in |
|
31 | if 'metadata' in output: | |
33 |
del |
|
32 | del output['metadata'] | |
34 |
if 'text' in |
|
33 | if 'text' in output: | |
35 |
|
|
34 | output['text'] = re.sub(addr_pat, '<HEXADDR>', output['text']) | |
36 |
if 'svg' in |
|
35 | if 'svg' in output: | |
37 |
del |
|
36 | del output['text'] | |
38 |
if 'traceback' in |
|
37 | if 'traceback' in output: | |
39 | tb = [] |
|
38 | tb = [] | |
40 |
for line in |
|
39 | for line in output['traceback']: | |
41 | tb.append(strip_ansi(line)) |
|
40 | tb.append(strip_ansi(line)) | |
42 |
|
|
41 | output['traceback'] = tb | |
43 |
|
42 | |||
44 |
return |
|
43 | return output | |
45 |
|
44 | |||
46 |
|
45 | |||
47 | def assert_notebooks_equal(self, expected, actual): |
|
46 | def assert_notebooks_equal(self, expected, actual): | |
48 | expected_cells = expected['worksheets'][0]['cells'] |
|
47 | expected_cells = expected['worksheets'][0]['cells'] | |
49 | actual_cells = actual['worksheets'][0]['cells'] |
|
48 | actual_cells = actual['worksheets'][0]['cells'] | |
50 | assert len(expected_cells) == len(actual_cells) |
|
49 | assert len(expected_cells) == len(actual_cells) | |
51 |
|
50 | |||
52 | for expected_cell, actual_cell in zip(expected_cells, actual_cells): |
|
51 | for expected_cell, actual_cell in zip(expected_cells, actual_cells): | |
53 | expected_outputs = expected_cell.get('outputs', []) |
|
52 | expected_outputs = expected_cell.get('outputs', []) | |
54 | actual_outputs = actual_cell.get('outputs', []) |
|
53 | actual_outputs = actual_cell.get('outputs', []) | |
55 |
normalized_expected_outputs = list(map(self.normalize_ |
|
54 | normalized_expected_outputs = list(map(self.normalize_output, expected_outputs)) | |
56 |
normalized_actual_outputs = list(map(self.normalize_ |
|
55 | normalized_actual_outputs = list(map(self.normalize_output, actual_outputs)) | |
57 | assert normalized_expected_outputs == normalized_actual_outputs |
|
56 | assert normalized_expected_outputs == normalized_actual_outputs | |
58 |
|
57 | |||
59 |
|
58 | |||
60 | def build_preprocessor(self): |
|
59 | def build_preprocessor(self): | |
61 | """Make an instance of a preprocessor""" |
|
60 | """Make an instance of a preprocessor""" | |
62 | preprocessor = ExecutePreprocessor() |
|
61 | preprocessor = ExecutePreprocessor() | |
63 | preprocessor.enabled = True |
|
62 | preprocessor.enabled = True | |
64 | return preprocessor |
|
63 | return preprocessor | |
65 |
|
64 | |||
66 |
|
65 | |||
67 | def test_constructor(self): |
|
66 | def test_constructor(self): | |
68 | """Can a ExecutePreprocessor be constructed?""" |
|
67 | """Can a ExecutePreprocessor be constructed?""" | |
69 | self.build_preprocessor() |
|
68 | self.build_preprocessor() | |
70 |
|
69 | |||
71 |
|
70 | |||
72 | def test_run_notebooks(self): |
|
71 | def test_run_notebooks(self): | |
73 | """Runs a series of test notebooks and compares them to their actual output""" |
|
72 | """Runs a series of test notebooks and compares them to their actual output""" | |
74 | current_dir = os.path.dirname(__file__) |
|
73 | current_dir = os.path.dirname(__file__) | |
75 | input_files = os.listdir(os.path.join(current_dir, 'input')) |
|
74 | input_files = os.listdir(os.path.join(current_dir, 'input')) | |
76 | for filename in input_files: |
|
75 | for filename in input_files: | |
77 | if not filename.endswith(".ipynb"): |
|
76 | if not filename.endswith(".ipynb"): | |
78 | continue |
|
77 | continue | |
79 | with open(os.path.join(current_dir, 'input', filename)) as f: |
|
78 | with open(os.path.join(current_dir, 'input', filename)) as f: | |
80 | input_nb = nbformat.read(f, 'ipynb') |
|
79 | input_nb = nbformat.read(f, 'ipynb') | |
81 | with open(os.path.join(current_dir, 'expected', filename)) as f: |
|
80 | with open(os.path.join(current_dir, 'expected', filename)) as f: | |
82 | expected_nb = nbformat.read(f, 'ipynb') |
|
81 | expected_nb = nbformat.read(f, 'ipynb') | |
83 | res = self.build_resources() |
|
82 | res = self.build_resources() | |
84 | preprocessor = self.build_preprocessor() |
|
83 | preprocessor = self.build_preprocessor() | |
85 | output_nb, _ = preprocessor(input_nb, res) |
|
84 | output_nb, _ = preprocessor(input_nb, res) | |
86 | self.assert_notebooks_equal(output_nb, expected_nb) |
|
85 | self.assert_notebooks_equal(output_nb, expected_nb) | |
87 |
|
86 |
General Comments 0
You need to be logged in to leave comments.
Login now