##// END OF EJS Templates
Backport PR #12503: try to fix doc build
Matthias Bussonnier -
Show More
@@ -1,723 +1,726 b''
1 """Input transformer machinery to support IPython special syntax.
1 """Input transformer machinery to support IPython special syntax.
2
2
3 This includes the machinery to recognise and transform ``%magic`` commands,
3 This includes the machinery to recognise and transform ``%magic`` commands,
4 ``!system`` commands, ``help?`` querying, prompt stripping, and so forth.
4 ``!system`` commands, ``help?`` querying, prompt stripping, and so forth.
5
5
6 Added: IPython 7.0. Replaces inputsplitter and inputtransformer which were
6 Added: IPython 7.0. Replaces inputsplitter and inputtransformer which were
7 deprecated in 7.0.
7 deprecated in 7.0.
8 """
8 """
9
9
10 # Copyright (c) IPython Development Team.
10 # Copyright (c) IPython Development Team.
11 # Distributed under the terms of the Modified BSD License.
11 # Distributed under the terms of the Modified BSD License.
12
12
13 from codeop import compile_command
13 from codeop import compile_command
14 import re
14 import re
15 import tokenize
15 import tokenize
16 from typing import List, Tuple, Union
16 from typing import List, Tuple, Union
17 import warnings
17 import warnings
18
18
19 _indent_re = re.compile(r'^[ \t]+')
19 _indent_re = re.compile(r'^[ \t]+')
20
20
21 def leading_empty_lines(lines):
21 def leading_empty_lines(lines):
22 """Remove leading empty lines
22 """Remove leading empty lines
23
23
24 If the leading lines are empty or contain only whitespace, they will be
24 If the leading lines are empty or contain only whitespace, they will be
25 removed.
25 removed.
26 """
26 """
27 if not lines:
27 if not lines:
28 return lines
28 return lines
29 for i, line in enumerate(lines):
29 for i, line in enumerate(lines):
30 if line and not line.isspace():
30 if line and not line.isspace():
31 return lines[i:]
31 return lines[i:]
32 return lines
32 return lines
33
33
34 def leading_indent(lines):
34 def leading_indent(lines):
35 """Remove leading indentation.
35 """Remove leading indentation.
36
36
37 If the first line starts with a spaces or tabs, the same whitespace will be
37 If the first line starts with a spaces or tabs, the same whitespace will be
38 removed from each following line in the cell.
38 removed from each following line in the cell.
39 """
39 """
40 if not lines:
40 if not lines:
41 return lines
41 return lines
42 m = _indent_re.match(lines[0])
42 m = _indent_re.match(lines[0])
43 if not m:
43 if not m:
44 return lines
44 return lines
45 space = m.group(0)
45 space = m.group(0)
46 n = len(space)
46 n = len(space)
47 return [l[n:] if l.startswith(space) else l
47 return [l[n:] if l.startswith(space) else l
48 for l in lines]
48 for l in lines]
49
49
50 class PromptStripper:
50 class PromptStripper:
51 """Remove matching input prompts from a block of input.
51 """Remove matching input prompts from a block of input.
52
52
53 Parameters
53 Parameters
54 ----------
54 ----------
55 prompt_re : regular expression
55 prompt_re : regular expression
56 A regular expression matching any input prompt (including continuation,
56 A regular expression matching any input prompt (including continuation,
57 e.g. ``...``)
57 e.g. ``...``)
58 initial_re : regular expression, optional
58 initial_re : regular expression, optional
59 A regular expression matching only the initial prompt, but not continuation.
59 A regular expression matching only the initial prompt, but not continuation.
60 If no initial expression is given, prompt_re will be used everywhere.
60 If no initial expression is given, prompt_re will be used everywhere.
61 Used mainly for plain Python prompts (``>>>``), where the continuation prompt
61 Used mainly for plain Python prompts (``>>>``), where the continuation prompt
62 ``...`` is a valid Python expression in Python 3, so shouldn't be stripped.
62 ``...`` is a valid Python expression in Python 3, so shouldn't be stripped.
63
63
64 Notes
65 -----
66
64 If initial_re and prompt_re differ,
67 If initial_re and prompt_re differ,
65 only initial_re will be tested against the first line.
68 only initial_re will be tested against the first line.
66 If any prompt is found on the first two lines,
69 If any prompt is found on the first two lines,
67 prompts will be stripped from the rest of the block.
70 prompts will be stripped from the rest of the block.
68 """
71 """
69 def __init__(self, prompt_re, initial_re=None):
72 def __init__(self, prompt_re, initial_re=None):
70 self.prompt_re = prompt_re
73 self.prompt_re = prompt_re
71 self.initial_re = initial_re or prompt_re
74 self.initial_re = initial_re or prompt_re
72
75
73 def _strip(self, lines):
76 def _strip(self, lines):
74 return [self.prompt_re.sub('', l, count=1) for l in lines]
77 return [self.prompt_re.sub('', l, count=1) for l in lines]
75
78
76 def __call__(self, lines):
79 def __call__(self, lines):
77 if not lines:
80 if not lines:
78 return lines
81 return lines
79 if self.initial_re.match(lines[0]) or \
82 if self.initial_re.match(lines[0]) or \
80 (len(lines) > 1 and self.prompt_re.match(lines[1])):
83 (len(lines) > 1 and self.prompt_re.match(lines[1])):
81 return self._strip(lines)
84 return self._strip(lines)
82 return lines
85 return lines
83
86
84 classic_prompt = PromptStripper(
87 classic_prompt = PromptStripper(
85 prompt_re=re.compile(r'^(>>>|\.\.\.)( |$)'),
88 prompt_re=re.compile(r'^(>>>|\.\.\.)( |$)'),
86 initial_re=re.compile(r'^>>>( |$)')
89 initial_re=re.compile(r'^>>>( |$)')
87 )
90 )
88
91
89 ipython_prompt = PromptStripper(re.compile(r'^(In \[\d+\]: |\s*\.{3,}: ?)'))
92 ipython_prompt = PromptStripper(re.compile(r'^(In \[\d+\]: |\s*\.{3,}: ?)'))
90
93
91 def cell_magic(lines):
94 def cell_magic(lines):
92 if not lines or not lines[0].startswith('%%'):
95 if not lines or not lines[0].startswith('%%'):
93 return lines
96 return lines
94 if re.match(r'%%\w+\?', lines[0]):
97 if re.match(r'%%\w+\?', lines[0]):
95 # This case will be handled by help_end
98 # This case will be handled by help_end
96 return lines
99 return lines
97 magic_name, _, first_line = lines[0][2:].rstrip().partition(' ')
100 magic_name, _, first_line = lines[0][2:].rstrip().partition(' ')
98 body = ''.join(lines[1:])
101 body = ''.join(lines[1:])
99 return ['get_ipython().run_cell_magic(%r, %r, %r)\n'
102 return ['get_ipython().run_cell_magic(%r, %r, %r)\n'
100 % (magic_name, first_line, body)]
103 % (magic_name, first_line, body)]
101
104
102
105
103 def _find_assign_op(token_line) -> Union[int, None]:
106 def _find_assign_op(token_line) -> Union[int, None]:
104 """Get the index of the first assignment in the line ('=' not inside brackets)
107 """Get the index of the first assignment in the line ('=' not inside brackets)
105
108
106 Note: We don't try to support multiple special assignment (a = b = %foo)
109 Note: We don't try to support multiple special assignment (a = b = %foo)
107 """
110 """
108 paren_level = 0
111 paren_level = 0
109 for i, ti in enumerate(token_line):
112 for i, ti in enumerate(token_line):
110 s = ti.string
113 s = ti.string
111 if s == '=' and paren_level == 0:
114 if s == '=' and paren_level == 0:
112 return i
115 return i
113 if s in {'(','[','{'}:
116 if s in {'(','[','{'}:
114 paren_level += 1
117 paren_level += 1
115 elif s in {')', ']', '}'}:
118 elif s in {')', ']', '}'}:
116 if paren_level > 0:
119 if paren_level > 0:
117 paren_level -= 1
120 paren_level -= 1
118
121
119 def find_end_of_continued_line(lines, start_line: int):
122 def find_end_of_continued_line(lines, start_line: int):
120 """Find the last line of a line explicitly extended using backslashes.
123 """Find the last line of a line explicitly extended using backslashes.
121
124
122 Uses 0-indexed line numbers.
125 Uses 0-indexed line numbers.
123 """
126 """
124 end_line = start_line
127 end_line = start_line
125 while lines[end_line].endswith('\\\n'):
128 while lines[end_line].endswith('\\\n'):
126 end_line += 1
129 end_line += 1
127 if end_line >= len(lines):
130 if end_line >= len(lines):
128 break
131 break
129 return end_line
132 return end_line
130
133
131 def assemble_continued_line(lines, start: Tuple[int, int], end_line: int):
134 def assemble_continued_line(lines, start: Tuple[int, int], end_line: int):
132 r"""Assemble a single line from multiple continued line pieces
135 r"""Assemble a single line from multiple continued line pieces
133
136
134 Continued lines are lines ending in ``\``, and the line following the last
137 Continued lines are lines ending in ``\``, and the line following the last
135 ``\`` in the block.
138 ``\`` in the block.
136
139
137 For example, this code continues over multiple lines::
140 For example, this code continues over multiple lines::
138
141
139 if (assign_ix is not None) \
142 if (assign_ix is not None) \
140 and (len(line) >= assign_ix + 2) \
143 and (len(line) >= assign_ix + 2) \
141 and (line[assign_ix+1].string == '%') \
144 and (line[assign_ix+1].string == '%') \
142 and (line[assign_ix+2].type == tokenize.NAME):
145 and (line[assign_ix+2].type == tokenize.NAME):
143
146
144 This statement contains four continued line pieces.
147 This statement contains four continued line pieces.
145 Assembling these pieces into a single line would give::
148 Assembling these pieces into a single line would give::
146
149
147 if (assign_ix is not None) and (len(line) >= assign_ix + 2) and (line[...
150 if (assign_ix is not None) and (len(line) >= assign_ix + 2) and (line[...
148
151
149 This uses 0-indexed line numbers. *start* is (lineno, colno).
152 This uses 0-indexed line numbers. *start* is (lineno, colno).
150
153
151 Used to allow ``%magic`` and ``!system`` commands to be continued over
154 Used to allow ``%magic`` and ``!system`` commands to be continued over
152 multiple lines.
155 multiple lines.
153 """
156 """
154 parts = [lines[start[0]][start[1]:]] + lines[start[0]+1:end_line+1]
157 parts = [lines[start[0]][start[1]:]] + lines[start[0]+1:end_line+1]
155 return ' '.join([p.rstrip()[:-1] for p in parts[:-1]] # Strip backslash+newline
158 return ' '.join([p.rstrip()[:-1] for p in parts[:-1]] # Strip backslash+newline
156 + [parts[-1].rstrip()]) # Strip newline from last line
159 + [parts[-1].rstrip()]) # Strip newline from last line
157
160
158 class TokenTransformBase:
161 class TokenTransformBase:
159 """Base class for transformations which examine tokens.
162 """Base class for transformations which examine tokens.
160
163
161 Special syntax should not be transformed when it occurs inside strings or
164 Special syntax should not be transformed when it occurs inside strings or
162 comments. This is hard to reliably avoid with regexes. The solution is to
165 comments. This is hard to reliably avoid with regexes. The solution is to
163 tokenise the code as Python, and recognise the special syntax in the tokens.
166 tokenise the code as Python, and recognise the special syntax in the tokens.
164
167
165 IPython's special syntax is not valid Python syntax, so tokenising may go
168 IPython's special syntax is not valid Python syntax, so tokenising may go
166 wrong after the special syntax starts. These classes therefore find and
169 wrong after the special syntax starts. These classes therefore find and
167 transform *one* instance of special syntax at a time into regular Python
170 transform *one* instance of special syntax at a time into regular Python
168 syntax. After each transformation, tokens are regenerated to find the next
171 syntax. After each transformation, tokens are regenerated to find the next
169 piece of special syntax.
172 piece of special syntax.
170
173
171 Subclasses need to implement one class method (find)
174 Subclasses need to implement one class method (find)
172 and one regular method (transform).
175 and one regular method (transform).
173
176
174 The priority attribute can select which transformation to apply if multiple
177 The priority attribute can select which transformation to apply if multiple
175 transformers match in the same place. Lower numbers have higher priority.
178 transformers match in the same place. Lower numbers have higher priority.
176 This allows "%magic?" to be turned into a help call rather than a magic call.
179 This allows "%magic?" to be turned into a help call rather than a magic call.
177 """
180 """
178 # Lower numbers -> higher priority (for matches in the same location)
181 # Lower numbers -> higher priority (for matches in the same location)
179 priority = 10
182 priority = 10
180
183
181 def sortby(self):
184 def sortby(self):
182 return self.start_line, self.start_col, self.priority
185 return self.start_line, self.start_col, self.priority
183
186
184 def __init__(self, start):
187 def __init__(self, start):
185 self.start_line = start[0] - 1 # Shift from 1-index to 0-index
188 self.start_line = start[0] - 1 # Shift from 1-index to 0-index
186 self.start_col = start[1]
189 self.start_col = start[1]
187
190
188 @classmethod
191 @classmethod
189 def find(cls, tokens_by_line):
192 def find(cls, tokens_by_line):
190 """Find one instance of special syntax in the provided tokens.
193 """Find one instance of special syntax in the provided tokens.
191
194
192 Tokens are grouped into logical lines for convenience,
195 Tokens are grouped into logical lines for convenience,
193 so it is easy to e.g. look at the first token of each line.
196 so it is easy to e.g. look at the first token of each line.
194 *tokens_by_line* is a list of lists of tokenize.TokenInfo objects.
197 *tokens_by_line* is a list of lists of tokenize.TokenInfo objects.
195
198
196 This should return an instance of its class, pointing to the start
199 This should return an instance of its class, pointing to the start
197 position it has found, or None if it found no match.
200 position it has found, or None if it found no match.
198 """
201 """
199 raise NotImplementedError
202 raise NotImplementedError
200
203
201 def transform(self, lines: List[str]):
204 def transform(self, lines: List[str]):
202 """Transform one instance of special syntax found by ``find()``
205 """Transform one instance of special syntax found by ``find()``
203
206
204 Takes a list of strings representing physical lines,
207 Takes a list of strings representing physical lines,
205 returns a similar list of transformed lines.
208 returns a similar list of transformed lines.
206 """
209 """
207 raise NotImplementedError
210 raise NotImplementedError
208
211
209 class MagicAssign(TokenTransformBase):
212 class MagicAssign(TokenTransformBase):
210 """Transformer for assignments from magics (a = %foo)"""
213 """Transformer for assignments from magics (a = %foo)"""
211 @classmethod
214 @classmethod
212 def find(cls, tokens_by_line):
215 def find(cls, tokens_by_line):
213 """Find the first magic assignment (a = %foo) in the cell.
216 """Find the first magic assignment (a = %foo) in the cell.
214 """
217 """
215 for line in tokens_by_line:
218 for line in tokens_by_line:
216 assign_ix = _find_assign_op(line)
219 assign_ix = _find_assign_op(line)
217 if (assign_ix is not None) \
220 if (assign_ix is not None) \
218 and (len(line) >= assign_ix + 2) \
221 and (len(line) >= assign_ix + 2) \
219 and (line[assign_ix+1].string == '%') \
222 and (line[assign_ix+1].string == '%') \
220 and (line[assign_ix+2].type == tokenize.NAME):
223 and (line[assign_ix+2].type == tokenize.NAME):
221 return cls(line[assign_ix+1].start)
224 return cls(line[assign_ix+1].start)
222
225
223 def transform(self, lines: List[str]):
226 def transform(self, lines: List[str]):
224 """Transform a magic assignment found by the ``find()`` classmethod.
227 """Transform a magic assignment found by the ``find()`` classmethod.
225 """
228 """
226 start_line, start_col = self.start_line, self.start_col
229 start_line, start_col = self.start_line, self.start_col
227 lhs = lines[start_line][:start_col]
230 lhs = lines[start_line][:start_col]
228 end_line = find_end_of_continued_line(lines, start_line)
231 end_line = find_end_of_continued_line(lines, start_line)
229 rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
232 rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
230 assert rhs.startswith('%'), rhs
233 assert rhs.startswith('%'), rhs
231 magic_name, _, args = rhs[1:].partition(' ')
234 magic_name, _, args = rhs[1:].partition(' ')
232
235
233 lines_before = lines[:start_line]
236 lines_before = lines[:start_line]
234 call = "get_ipython().run_line_magic({!r}, {!r})".format(magic_name, args)
237 call = "get_ipython().run_line_magic({!r}, {!r})".format(magic_name, args)
235 new_line = lhs + call + '\n'
238 new_line = lhs + call + '\n'
236 lines_after = lines[end_line+1:]
239 lines_after = lines[end_line+1:]
237
240
238 return lines_before + [new_line] + lines_after
241 return lines_before + [new_line] + lines_after
239
242
240
243
241 class SystemAssign(TokenTransformBase):
244 class SystemAssign(TokenTransformBase):
242 """Transformer for assignments from system commands (a = !foo)"""
245 """Transformer for assignments from system commands (a = !foo)"""
243 @classmethod
246 @classmethod
244 def find(cls, tokens_by_line):
247 def find(cls, tokens_by_line):
245 """Find the first system assignment (a = !foo) in the cell.
248 """Find the first system assignment (a = !foo) in the cell.
246 """
249 """
247 for line in tokens_by_line:
250 for line in tokens_by_line:
248 assign_ix = _find_assign_op(line)
251 assign_ix = _find_assign_op(line)
249 if (assign_ix is not None) \
252 if (assign_ix is not None) \
250 and not line[assign_ix].line.strip().startswith('=') \
253 and not line[assign_ix].line.strip().startswith('=') \
251 and (len(line) >= assign_ix + 2) \
254 and (len(line) >= assign_ix + 2) \
252 and (line[assign_ix + 1].type == tokenize.ERRORTOKEN):
255 and (line[assign_ix + 1].type == tokenize.ERRORTOKEN):
253 ix = assign_ix + 1
256 ix = assign_ix + 1
254
257
255 while ix < len(line) and line[ix].type == tokenize.ERRORTOKEN:
258 while ix < len(line) and line[ix].type == tokenize.ERRORTOKEN:
256 if line[ix].string == '!':
259 if line[ix].string == '!':
257 return cls(line[ix].start)
260 return cls(line[ix].start)
258 elif not line[ix].string.isspace():
261 elif not line[ix].string.isspace():
259 break
262 break
260 ix += 1
263 ix += 1
261
264
262 def transform(self, lines: List[str]):
265 def transform(self, lines: List[str]):
263 """Transform a system assignment found by the ``find()`` classmethod.
266 """Transform a system assignment found by the ``find()`` classmethod.
264 """
267 """
265 start_line, start_col = self.start_line, self.start_col
268 start_line, start_col = self.start_line, self.start_col
266
269
267 lhs = lines[start_line][:start_col]
270 lhs = lines[start_line][:start_col]
268 end_line = find_end_of_continued_line(lines, start_line)
271 end_line = find_end_of_continued_line(lines, start_line)
269 rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
272 rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
270 assert rhs.startswith('!'), rhs
273 assert rhs.startswith('!'), rhs
271 cmd = rhs[1:]
274 cmd = rhs[1:]
272
275
273 lines_before = lines[:start_line]
276 lines_before = lines[:start_line]
274 call = "get_ipython().getoutput({!r})".format(cmd)
277 call = "get_ipython().getoutput({!r})".format(cmd)
275 new_line = lhs + call + '\n'
278 new_line = lhs + call + '\n'
276 lines_after = lines[end_line + 1:]
279 lines_after = lines[end_line + 1:]
277
280
278 return lines_before + [new_line] + lines_after
281 return lines_before + [new_line] + lines_after
279
282
280 # The escape sequences that define the syntax transformations IPython will
283 # The escape sequences that define the syntax transformations IPython will
281 # apply to user input. These can NOT be just changed here: many regular
284 # apply to user input. These can NOT be just changed here: many regular
282 # expressions and other parts of the code may use their hardcoded values, and
285 # expressions and other parts of the code may use their hardcoded values, and
283 # for all intents and purposes they constitute the 'IPython syntax', so they
286 # for all intents and purposes they constitute the 'IPython syntax', so they
284 # should be considered fixed.
287 # should be considered fixed.
285
288
286 ESC_SHELL = '!' # Send line to underlying system shell
289 ESC_SHELL = '!' # Send line to underlying system shell
287 ESC_SH_CAP = '!!' # Send line to system shell and capture output
290 ESC_SH_CAP = '!!' # Send line to system shell and capture output
288 ESC_HELP = '?' # Find information about object
291 ESC_HELP = '?' # Find information about object
289 ESC_HELP2 = '??' # Find extra-detailed information about object
292 ESC_HELP2 = '??' # Find extra-detailed information about object
290 ESC_MAGIC = '%' # Call magic function
293 ESC_MAGIC = '%' # Call magic function
291 ESC_MAGIC2 = '%%' # Call cell-magic function
294 ESC_MAGIC2 = '%%' # Call cell-magic function
292 ESC_QUOTE = ',' # Split args on whitespace, quote each as string and call
295 ESC_QUOTE = ',' # Split args on whitespace, quote each as string and call
293 ESC_QUOTE2 = ';' # Quote all args as a single string, call
296 ESC_QUOTE2 = ';' # Quote all args as a single string, call
294 ESC_PAREN = '/' # Call first argument with rest of line as arguments
297 ESC_PAREN = '/' # Call first argument with rest of line as arguments
295
298
296 ESCAPE_SINGLES = {'!', '?', '%', ',', ';', '/'}
299 ESCAPE_SINGLES = {'!', '?', '%', ',', ';', '/'}
297 ESCAPE_DOUBLES = {'!!', '??'} # %% (cell magic) is handled separately
300 ESCAPE_DOUBLES = {'!!', '??'} # %% (cell magic) is handled separately
298
301
299 def _make_help_call(target, esc, next_input=None):
302 def _make_help_call(target, esc, next_input=None):
300 """Prepares a pinfo(2)/psearch call from a target name and the escape
303 """Prepares a pinfo(2)/psearch call from a target name and the escape
301 (i.e. ? or ??)"""
304 (i.e. ? or ??)"""
302 method = 'pinfo2' if esc == '??' \
305 method = 'pinfo2' if esc == '??' \
303 else 'psearch' if '*' in target \
306 else 'psearch' if '*' in target \
304 else 'pinfo'
307 else 'pinfo'
305 arg = " ".join([method, target])
308 arg = " ".join([method, target])
306 #Prepare arguments for get_ipython().run_line_magic(magic_name, magic_args)
309 #Prepare arguments for get_ipython().run_line_magic(magic_name, magic_args)
307 t_magic_name, _, t_magic_arg_s = arg.partition(' ')
310 t_magic_name, _, t_magic_arg_s = arg.partition(' ')
308 t_magic_name = t_magic_name.lstrip(ESC_MAGIC)
311 t_magic_name = t_magic_name.lstrip(ESC_MAGIC)
309 if next_input is None:
312 if next_input is None:
310 return 'get_ipython().run_line_magic(%r, %r)' % (t_magic_name, t_magic_arg_s)
313 return 'get_ipython().run_line_magic(%r, %r)' % (t_magic_name, t_magic_arg_s)
311 else:
314 else:
312 return 'get_ipython().set_next_input(%r);get_ipython().run_line_magic(%r, %r)' % \
315 return 'get_ipython().set_next_input(%r);get_ipython().run_line_magic(%r, %r)' % \
313 (next_input, t_magic_name, t_magic_arg_s)
316 (next_input, t_magic_name, t_magic_arg_s)
314
317
315 def _tr_help(content):
318 def _tr_help(content):
316 """Translate lines escaped with: ?
319 """Translate lines escaped with: ?
317
320
318 A naked help line should fire the intro help screen (shell.show_usage())
321 A naked help line should fire the intro help screen (shell.show_usage())
319 """
322 """
320 if not content:
323 if not content:
321 return 'get_ipython().show_usage()'
324 return 'get_ipython().show_usage()'
322
325
323 return _make_help_call(content, '?')
326 return _make_help_call(content, '?')
324
327
325 def _tr_help2(content):
328 def _tr_help2(content):
326 """Translate lines escaped with: ??
329 """Translate lines escaped with: ??
327
330
328 A naked help line should fire the intro help screen (shell.show_usage())
331 A naked help line should fire the intro help screen (shell.show_usage())
329 """
332 """
330 if not content:
333 if not content:
331 return 'get_ipython().show_usage()'
334 return 'get_ipython().show_usage()'
332
335
333 return _make_help_call(content, '??')
336 return _make_help_call(content, '??')
334
337
335 def _tr_magic(content):
338 def _tr_magic(content):
336 "Translate lines escaped with a percent sign: %"
339 "Translate lines escaped with a percent sign: %"
337 name, _, args = content.partition(' ')
340 name, _, args = content.partition(' ')
338 return 'get_ipython().run_line_magic(%r, %r)' % (name, args)
341 return 'get_ipython().run_line_magic(%r, %r)' % (name, args)
339
342
340 def _tr_quote(content):
343 def _tr_quote(content):
341 "Translate lines escaped with a comma: ,"
344 "Translate lines escaped with a comma: ,"
342 name, _, args = content.partition(' ')
345 name, _, args = content.partition(' ')
343 return '%s("%s")' % (name, '", "'.join(args.split()) )
346 return '%s("%s")' % (name, '", "'.join(args.split()) )
344
347
345 def _tr_quote2(content):
348 def _tr_quote2(content):
346 "Translate lines escaped with a semicolon: ;"
349 "Translate lines escaped with a semicolon: ;"
347 name, _, args = content.partition(' ')
350 name, _, args = content.partition(' ')
348 return '%s("%s")' % (name, args)
351 return '%s("%s")' % (name, args)
349
352
350 def _tr_paren(content):
353 def _tr_paren(content):
351 "Translate lines escaped with a slash: /"
354 "Translate lines escaped with a slash: /"
352 name, _, args = content.partition(' ')
355 name, _, args = content.partition(' ')
353 return '%s(%s)' % (name, ", ".join(args.split()))
356 return '%s(%s)' % (name, ", ".join(args.split()))
354
357
355 tr = { ESC_SHELL : 'get_ipython().system({!r})'.format,
358 tr = { ESC_SHELL : 'get_ipython().system({!r})'.format,
356 ESC_SH_CAP : 'get_ipython().getoutput({!r})'.format,
359 ESC_SH_CAP : 'get_ipython().getoutput({!r})'.format,
357 ESC_HELP : _tr_help,
360 ESC_HELP : _tr_help,
358 ESC_HELP2 : _tr_help2,
361 ESC_HELP2 : _tr_help2,
359 ESC_MAGIC : _tr_magic,
362 ESC_MAGIC : _tr_magic,
360 ESC_QUOTE : _tr_quote,
363 ESC_QUOTE : _tr_quote,
361 ESC_QUOTE2 : _tr_quote2,
364 ESC_QUOTE2 : _tr_quote2,
362 ESC_PAREN : _tr_paren }
365 ESC_PAREN : _tr_paren }
363
366
364 class EscapedCommand(TokenTransformBase):
367 class EscapedCommand(TokenTransformBase):
365 """Transformer for escaped commands like %foo, !foo, or /foo"""
368 """Transformer for escaped commands like %foo, !foo, or /foo"""
366 @classmethod
369 @classmethod
367 def find(cls, tokens_by_line):
370 def find(cls, tokens_by_line):
368 """Find the first escaped command (%foo, !foo, etc.) in the cell.
371 """Find the first escaped command (%foo, !foo, etc.) in the cell.
369 """
372 """
370 for line in tokens_by_line:
373 for line in tokens_by_line:
371 if not line:
374 if not line:
372 continue
375 continue
373 ix = 0
376 ix = 0
374 ll = len(line)
377 ll = len(line)
375 while ll > ix and line[ix].type in {tokenize.INDENT, tokenize.DEDENT}:
378 while ll > ix and line[ix].type in {tokenize.INDENT, tokenize.DEDENT}:
376 ix += 1
379 ix += 1
377 if ix >= ll:
380 if ix >= ll:
378 continue
381 continue
379 if line[ix].string in ESCAPE_SINGLES:
382 if line[ix].string in ESCAPE_SINGLES:
380 return cls(line[ix].start)
383 return cls(line[ix].start)
381
384
382 def transform(self, lines):
385 def transform(self, lines):
383 """Transform an escaped line found by the ``find()`` classmethod.
386 """Transform an escaped line found by the ``find()`` classmethod.
384 """
387 """
385 start_line, start_col = self.start_line, self.start_col
388 start_line, start_col = self.start_line, self.start_col
386
389
387 indent = lines[start_line][:start_col]
390 indent = lines[start_line][:start_col]
388 end_line = find_end_of_continued_line(lines, start_line)
391 end_line = find_end_of_continued_line(lines, start_line)
389 line = assemble_continued_line(lines, (start_line, start_col), end_line)
392 line = assemble_continued_line(lines, (start_line, start_col), end_line)
390
393
391 if len(line) > 1 and line[:2] in ESCAPE_DOUBLES:
394 if len(line) > 1 and line[:2] in ESCAPE_DOUBLES:
392 escape, content = line[:2], line[2:]
395 escape, content = line[:2], line[2:]
393 else:
396 else:
394 escape, content = line[:1], line[1:]
397 escape, content = line[:1], line[1:]
395
398
396 if escape in tr:
399 if escape in tr:
397 call = tr[escape](content)
400 call = tr[escape](content)
398 else:
401 else:
399 call = ''
402 call = ''
400
403
401 lines_before = lines[:start_line]
404 lines_before = lines[:start_line]
402 new_line = indent + call + '\n'
405 new_line = indent + call + '\n'
403 lines_after = lines[end_line + 1:]
406 lines_after = lines[end_line + 1:]
404
407
405 return lines_before + [new_line] + lines_after
408 return lines_before + [new_line] + lines_after
406
409
407 _help_end_re = re.compile(r"""(%{0,2}
410 _help_end_re = re.compile(r"""(%{0,2}
408 (?!\d)[\w*]+ # Variable name
411 (?!\d)[\w*]+ # Variable name
409 (\.(?!\d)[\w*]+)* # .etc.etc
412 (\.(?!\d)[\w*]+)* # .etc.etc
410 )
413 )
411 (\?\??)$ # ? or ??
414 (\?\??)$ # ? or ??
412 """,
415 """,
413 re.VERBOSE)
416 re.VERBOSE)
414
417
415 class HelpEnd(TokenTransformBase):
418 class HelpEnd(TokenTransformBase):
416 """Transformer for help syntax: obj? and obj??"""
419 """Transformer for help syntax: obj? and obj??"""
417 # This needs to be higher priority (lower number) than EscapedCommand so
420 # This needs to be higher priority (lower number) than EscapedCommand so
418 # that inspecting magics (%foo?) works.
421 # that inspecting magics (%foo?) works.
419 priority = 5
422 priority = 5
420
423
421 def __init__(self, start, q_locn):
424 def __init__(self, start, q_locn):
422 super().__init__(start)
425 super().__init__(start)
423 self.q_line = q_locn[0] - 1 # Shift from 1-indexed to 0-indexed
426 self.q_line = q_locn[0] - 1 # Shift from 1-indexed to 0-indexed
424 self.q_col = q_locn[1]
427 self.q_col = q_locn[1]
425
428
426 @classmethod
429 @classmethod
427 def find(cls, tokens_by_line):
430 def find(cls, tokens_by_line):
428 """Find the first help command (foo?) in the cell.
431 """Find the first help command (foo?) in the cell.
429 """
432 """
430 for line in tokens_by_line:
433 for line in tokens_by_line:
431 # Last token is NEWLINE; look at last but one
434 # Last token is NEWLINE; look at last but one
432 if len(line) > 2 and line[-2].string == '?':
435 if len(line) > 2 and line[-2].string == '?':
433 # Find the first token that's not INDENT/DEDENT
436 # Find the first token that's not INDENT/DEDENT
434 ix = 0
437 ix = 0
435 while line[ix].type in {tokenize.INDENT, tokenize.DEDENT}:
438 while line[ix].type in {tokenize.INDENT, tokenize.DEDENT}:
436 ix += 1
439 ix += 1
437 return cls(line[ix].start, line[-2].start)
440 return cls(line[ix].start, line[-2].start)
438
441
439 def transform(self, lines):
442 def transform(self, lines):
440 """Transform a help command found by the ``find()`` classmethod.
443 """Transform a help command found by the ``find()`` classmethod.
441 """
444 """
442 piece = ''.join(lines[self.start_line:self.q_line+1])
445 piece = ''.join(lines[self.start_line:self.q_line+1])
443 indent, content = piece[:self.start_col], piece[self.start_col:]
446 indent, content = piece[:self.start_col], piece[self.start_col:]
444 lines_before = lines[:self.start_line]
447 lines_before = lines[:self.start_line]
445 lines_after = lines[self.q_line + 1:]
448 lines_after = lines[self.q_line + 1:]
446
449
447 m = _help_end_re.search(content)
450 m = _help_end_re.search(content)
448 if not m:
451 if not m:
449 raise SyntaxError(content)
452 raise SyntaxError(content)
450 assert m is not None, content
453 assert m is not None, content
451 target = m.group(1)
454 target = m.group(1)
452 esc = m.group(3)
455 esc = m.group(3)
453
456
454 # If we're mid-command, put it back on the next prompt for the user.
457 # If we're mid-command, put it back on the next prompt for the user.
455 next_input = None
458 next_input = None
456 if (not lines_before) and (not lines_after) \
459 if (not lines_before) and (not lines_after) \
457 and content.strip() != m.group(0):
460 and content.strip() != m.group(0):
458 next_input = content.rstrip('?\n')
461 next_input = content.rstrip('?\n')
459
462
460 call = _make_help_call(target, esc, next_input=next_input)
463 call = _make_help_call(target, esc, next_input=next_input)
461 new_line = indent + call + '\n'
464 new_line = indent + call + '\n'
462
465
463 return lines_before + [new_line] + lines_after
466 return lines_before + [new_line] + lines_after
464
467
465 def make_tokens_by_line(lines:List[str]):
468 def make_tokens_by_line(lines:List[str]):
466 """Tokenize a series of lines and group tokens by line.
469 """Tokenize a series of lines and group tokens by line.
467
470
468 The tokens for a multiline Python string or expression are grouped as one
471 The tokens for a multiline Python string or expression are grouped as one
469 line. All lines except the last lines should keep their line ending ('\\n',
472 line. All lines except the last lines should keep their line ending ('\\n',
470 '\\r\\n') for this to properly work. Use `.splitlines(keeplineending=True)`
473 '\\r\\n') for this to properly work. Use `.splitlines(keeplineending=True)`
471 for example when passing block of text to this function.
474 for example when passing block of text to this function.
472
475
473 """
476 """
474 # NL tokens are used inside multiline expressions, but also after blank
477 # NL tokens are used inside multiline expressions, but also after blank
475 # lines or comments. This is intentional - see https://bugs.python.org/issue17061
478 # lines or comments. This is intentional - see https://bugs.python.org/issue17061
476 # We want to group the former case together but split the latter, so we
479 # We want to group the former case together but split the latter, so we
477 # track parentheses level, similar to the internals of tokenize.
480 # track parentheses level, similar to the internals of tokenize.
478 NEWLINE, NL = tokenize.NEWLINE, tokenize.NL
481 NEWLINE, NL = tokenize.NEWLINE, tokenize.NL
479 tokens_by_line = [[]]
482 tokens_by_line = [[]]
480 if len(lines) > 1 and not lines[0].endswith(('\n', '\r', '\r\n', '\x0b', '\x0c')):
483 if len(lines) > 1 and not lines[0].endswith(('\n', '\r', '\r\n', '\x0b', '\x0c')):
481 warnings.warn("`make_tokens_by_line` received a list of lines which do not have lineending markers ('\\n', '\\r', '\\r\\n', '\\x0b', '\\x0c'), behavior will be unspecified")
484 warnings.warn("`make_tokens_by_line` received a list of lines which do not have lineending markers ('\\n', '\\r', '\\r\\n', '\\x0b', '\\x0c'), behavior will be unspecified")
482 parenlev = 0
485 parenlev = 0
483 try:
486 try:
484 for token in tokenize.generate_tokens(iter(lines).__next__):
487 for token in tokenize.generate_tokens(iter(lines).__next__):
485 tokens_by_line[-1].append(token)
488 tokens_by_line[-1].append(token)
486 if (token.type == NEWLINE) \
489 if (token.type == NEWLINE) \
487 or ((token.type == NL) and (parenlev <= 0)):
490 or ((token.type == NL) and (parenlev <= 0)):
488 tokens_by_line.append([])
491 tokens_by_line.append([])
489 elif token.string in {'(', '[', '{'}:
492 elif token.string in {'(', '[', '{'}:
490 parenlev += 1
493 parenlev += 1
491 elif token.string in {')', ']', '}'}:
494 elif token.string in {')', ']', '}'}:
492 if parenlev > 0:
495 if parenlev > 0:
493 parenlev -= 1
496 parenlev -= 1
494 except tokenize.TokenError:
497 except tokenize.TokenError:
495 # Input ended in a multiline string or expression. That's OK for us.
498 # Input ended in a multiline string or expression. That's OK for us.
496 pass
499 pass
497
500
498
501
499 if not tokens_by_line[-1]:
502 if not tokens_by_line[-1]:
500 tokens_by_line.pop()
503 tokens_by_line.pop()
501
504
502
505
503 return tokens_by_line
506 return tokens_by_line
504
507
505 def show_linewise_tokens(s: str):
508 def show_linewise_tokens(s: str):
506 """For investigation and debugging"""
509 """For investigation and debugging"""
507 if not s.endswith('\n'):
510 if not s.endswith('\n'):
508 s += '\n'
511 s += '\n'
509 lines = s.splitlines(keepends=True)
512 lines = s.splitlines(keepends=True)
510 for line in make_tokens_by_line(lines):
513 for line in make_tokens_by_line(lines):
511 print("Line -------")
514 print("Line -------")
512 for tokinfo in line:
515 for tokinfo in line:
513 print(" ", tokinfo)
516 print(" ", tokinfo)
514
517
515 # Arbitrary limit to prevent getting stuck in infinite loops
518 # Arbitrary limit to prevent getting stuck in infinite loops
516 TRANSFORM_LOOP_LIMIT = 500
519 TRANSFORM_LOOP_LIMIT = 500
517
520
518 class TransformerManager:
521 class TransformerManager:
519 """Applies various transformations to a cell or code block.
522 """Applies various transformations to a cell or code block.
520
523
521 The key methods for external use are ``transform_cell()``
524 The key methods for external use are ``transform_cell()``
522 and ``check_complete()``.
525 and ``check_complete()``.
523 """
526 """
524 def __init__(self):
527 def __init__(self):
525 self.cleanup_transforms = [
528 self.cleanup_transforms = [
526 leading_empty_lines,
529 leading_empty_lines,
527 leading_indent,
530 leading_indent,
528 classic_prompt,
531 classic_prompt,
529 ipython_prompt,
532 ipython_prompt,
530 ]
533 ]
531 self.line_transforms = [
534 self.line_transforms = [
532 cell_magic,
535 cell_magic,
533 ]
536 ]
534 self.token_transformers = [
537 self.token_transformers = [
535 MagicAssign,
538 MagicAssign,
536 SystemAssign,
539 SystemAssign,
537 EscapedCommand,
540 EscapedCommand,
538 HelpEnd,
541 HelpEnd,
539 ]
542 ]
540
543
541 def do_one_token_transform(self, lines):
544 def do_one_token_transform(self, lines):
542 """Find and run the transform earliest in the code.
545 """Find and run the transform earliest in the code.
543
546
544 Returns (changed, lines).
547 Returns (changed, lines).
545
548
546 This method is called repeatedly until changed is False, indicating
549 This method is called repeatedly until changed is False, indicating
547 that all available transformations are complete.
550 that all available transformations are complete.
548
551
549 The tokens following IPython special syntax might not be valid, so
552 The tokens following IPython special syntax might not be valid, so
550 the transformed code is retokenised every time to identify the next
553 the transformed code is retokenised every time to identify the next
551 piece of special syntax. Hopefully long code cells are mostly valid
554 piece of special syntax. Hopefully long code cells are mostly valid
552 Python, not using lots of IPython special syntax, so this shouldn't be
555 Python, not using lots of IPython special syntax, so this shouldn't be
553 a performance issue.
556 a performance issue.
554 """
557 """
555 tokens_by_line = make_tokens_by_line(lines)
558 tokens_by_line = make_tokens_by_line(lines)
556 candidates = []
559 candidates = []
557 for transformer_cls in self.token_transformers:
560 for transformer_cls in self.token_transformers:
558 transformer = transformer_cls.find(tokens_by_line)
561 transformer = transformer_cls.find(tokens_by_line)
559 if transformer:
562 if transformer:
560 candidates.append(transformer)
563 candidates.append(transformer)
561
564
562 if not candidates:
565 if not candidates:
563 # Nothing to transform
566 # Nothing to transform
564 return False, lines
567 return False, lines
565 ordered_transformers = sorted(candidates, key=TokenTransformBase.sortby)
568 ordered_transformers = sorted(candidates, key=TokenTransformBase.sortby)
566 for transformer in ordered_transformers:
569 for transformer in ordered_transformers:
567 try:
570 try:
568 return True, transformer.transform(lines)
571 return True, transformer.transform(lines)
569 except SyntaxError:
572 except SyntaxError:
570 pass
573 pass
571 return False, lines
574 return False, lines
572
575
573 def do_token_transforms(self, lines):
576 def do_token_transforms(self, lines):
574 for _ in range(TRANSFORM_LOOP_LIMIT):
577 for _ in range(TRANSFORM_LOOP_LIMIT):
575 changed, lines = self.do_one_token_transform(lines)
578 changed, lines = self.do_one_token_transform(lines)
576 if not changed:
579 if not changed:
577 return lines
580 return lines
578
581
579 raise RuntimeError("Input transformation still changing after "
582 raise RuntimeError("Input transformation still changing after "
580 "%d iterations. Aborting." % TRANSFORM_LOOP_LIMIT)
583 "%d iterations. Aborting." % TRANSFORM_LOOP_LIMIT)
581
584
582 def transform_cell(self, cell: str) -> str:
585 def transform_cell(self, cell: str) -> str:
583 """Transforms a cell of input code"""
586 """Transforms a cell of input code"""
584 if not cell.endswith('\n'):
587 if not cell.endswith('\n'):
585 cell += '\n' # Ensure the cell has a trailing newline
588 cell += '\n' # Ensure the cell has a trailing newline
586 lines = cell.splitlines(keepends=True)
589 lines = cell.splitlines(keepends=True)
587 for transform in self.cleanup_transforms + self.line_transforms:
590 for transform in self.cleanup_transforms + self.line_transforms:
588 lines = transform(lines)
591 lines = transform(lines)
589
592
590 lines = self.do_token_transforms(lines)
593 lines = self.do_token_transforms(lines)
591 return ''.join(lines)
594 return ''.join(lines)
592
595
593 def check_complete(self, cell: str):
596 def check_complete(self, cell: str):
594 """Return whether a block of code is ready to execute, or should be continued
597 """Return whether a block of code is ready to execute, or should be continued
595
598
596 Parameters
599 Parameters
597 ----------
600 ----------
598 source : string
601 source : string
599 Python input code, which can be multiline.
602 Python input code, which can be multiline.
600
603
601 Returns
604 Returns
602 -------
605 -------
603 status : str
606 status : str
604 One of 'complete', 'incomplete', or 'invalid' if source is not a
607 One of 'complete', 'incomplete', or 'invalid' if source is not a
605 prefix of valid code.
608 prefix of valid code.
606 indent_spaces : int or None
609 indent_spaces : int or None
607 The number of spaces by which to indent the next line of code. If
610 The number of spaces by which to indent the next line of code. If
608 status is not 'incomplete', this is None.
611 status is not 'incomplete', this is None.
609 """
612 """
610 # Remember if the lines ends in a new line.
613 # Remember if the lines ends in a new line.
611 ends_with_newline = False
614 ends_with_newline = False
612 for character in reversed(cell):
615 for character in reversed(cell):
613 if character == '\n':
616 if character == '\n':
614 ends_with_newline = True
617 ends_with_newline = True
615 break
618 break
616 elif character.strip():
619 elif character.strip():
617 break
620 break
618 else:
621 else:
619 continue
622 continue
620
623
621 if not ends_with_newline:
624 if not ends_with_newline:
622 # Append an newline for consistent tokenization
625 # Append an newline for consistent tokenization
623 # See https://bugs.python.org/issue33899
626 # See https://bugs.python.org/issue33899
624 cell += '\n'
627 cell += '\n'
625
628
626 lines = cell.splitlines(keepends=True)
629 lines = cell.splitlines(keepends=True)
627
630
628 if not lines:
631 if not lines:
629 return 'complete', None
632 return 'complete', None
630
633
631 if lines[-1].endswith('\\'):
634 if lines[-1].endswith('\\'):
632 # Explicit backslash continuation
635 # Explicit backslash continuation
633 return 'incomplete', find_last_indent(lines)
636 return 'incomplete', find_last_indent(lines)
634
637
635 try:
638 try:
636 for transform in self.cleanup_transforms:
639 for transform in self.cleanup_transforms:
637 if not getattr(transform, 'has_side_effects', False):
640 if not getattr(transform, 'has_side_effects', False):
638 lines = transform(lines)
641 lines = transform(lines)
639 except SyntaxError:
642 except SyntaxError:
640 return 'invalid', None
643 return 'invalid', None
641
644
642 if lines[0].startswith('%%'):
645 if lines[0].startswith('%%'):
643 # Special case for cell magics - completion marked by blank line
646 # Special case for cell magics - completion marked by blank line
644 if lines[-1].strip():
647 if lines[-1].strip():
645 return 'incomplete', find_last_indent(lines)
648 return 'incomplete', find_last_indent(lines)
646 else:
649 else:
647 return 'complete', None
650 return 'complete', None
648
651
649 try:
652 try:
650 for transform in self.line_transforms:
653 for transform in self.line_transforms:
651 if not getattr(transform, 'has_side_effects', False):
654 if not getattr(transform, 'has_side_effects', False):
652 lines = transform(lines)
655 lines = transform(lines)
653 lines = self.do_token_transforms(lines)
656 lines = self.do_token_transforms(lines)
654 except SyntaxError:
657 except SyntaxError:
655 return 'invalid', None
658 return 'invalid', None
656
659
657 tokens_by_line = make_tokens_by_line(lines)
660 tokens_by_line = make_tokens_by_line(lines)
658
661
659 if not tokens_by_line:
662 if not tokens_by_line:
660 return 'incomplete', find_last_indent(lines)
663 return 'incomplete', find_last_indent(lines)
661
664
662 if tokens_by_line[-1][-1].type != tokenize.ENDMARKER:
665 if tokens_by_line[-1][-1].type != tokenize.ENDMARKER:
663 # We're in a multiline string or expression
666 # We're in a multiline string or expression
664 return 'incomplete', find_last_indent(lines)
667 return 'incomplete', find_last_indent(lines)
665
668
666 newline_types = {tokenize.NEWLINE, tokenize.COMMENT, tokenize.ENDMARKER}
669 newline_types = {tokenize.NEWLINE, tokenize.COMMENT, tokenize.ENDMARKER}
667
670
668 # Pop the last line which only contains DEDENTs and ENDMARKER
671 # Pop the last line which only contains DEDENTs and ENDMARKER
669 last_token_line = None
672 last_token_line = None
670 if {t.type for t in tokens_by_line[-1]} in [
673 if {t.type for t in tokens_by_line[-1]} in [
671 {tokenize.DEDENT, tokenize.ENDMARKER},
674 {tokenize.DEDENT, tokenize.ENDMARKER},
672 {tokenize.ENDMARKER}
675 {tokenize.ENDMARKER}
673 ] and len(tokens_by_line) > 1:
676 ] and len(tokens_by_line) > 1:
674 last_token_line = tokens_by_line.pop()
677 last_token_line = tokens_by_line.pop()
675
678
676 while tokens_by_line[-1] and tokens_by_line[-1][-1].type in newline_types:
679 while tokens_by_line[-1] and tokens_by_line[-1][-1].type in newline_types:
677 tokens_by_line[-1].pop()
680 tokens_by_line[-1].pop()
678
681
679 if not tokens_by_line[-1]:
682 if not tokens_by_line[-1]:
680 return 'incomplete', find_last_indent(lines)
683 return 'incomplete', find_last_indent(lines)
681
684
682 if tokens_by_line[-1][-1].string == ':':
685 if tokens_by_line[-1][-1].string == ':':
683 # The last line starts a block (e.g. 'if foo:')
686 # The last line starts a block (e.g. 'if foo:')
684 ix = 0
687 ix = 0
685 while tokens_by_line[-1][ix].type in {tokenize.INDENT, tokenize.DEDENT}:
688 while tokens_by_line[-1][ix].type in {tokenize.INDENT, tokenize.DEDENT}:
686 ix += 1
689 ix += 1
687
690
688 indent = tokens_by_line[-1][ix].start[1]
691 indent = tokens_by_line[-1][ix].start[1]
689 return 'incomplete', indent + 4
692 return 'incomplete', indent + 4
690
693
691 if tokens_by_line[-1][0].line.endswith('\\'):
694 if tokens_by_line[-1][0].line.endswith('\\'):
692 return 'incomplete', None
695 return 'incomplete', None
693
696
694 # At this point, our checks think the code is complete (or invalid).
697 # At this point, our checks think the code is complete (or invalid).
695 # We'll use codeop.compile_command to check this with the real parser
698 # We'll use codeop.compile_command to check this with the real parser
696 try:
699 try:
697 with warnings.catch_warnings():
700 with warnings.catch_warnings():
698 warnings.simplefilter('error', SyntaxWarning)
701 warnings.simplefilter('error', SyntaxWarning)
699 res = compile_command(''.join(lines), symbol='exec')
702 res = compile_command(''.join(lines), symbol='exec')
700 except (SyntaxError, OverflowError, ValueError, TypeError,
703 except (SyntaxError, OverflowError, ValueError, TypeError,
701 MemoryError, SyntaxWarning):
704 MemoryError, SyntaxWarning):
702 return 'invalid', None
705 return 'invalid', None
703 else:
706 else:
704 if res is None:
707 if res is None:
705 return 'incomplete', find_last_indent(lines)
708 return 'incomplete', find_last_indent(lines)
706
709
707 if last_token_line and last_token_line[0].type == tokenize.DEDENT:
710 if last_token_line and last_token_line[0].type == tokenize.DEDENT:
708 if ends_with_newline:
711 if ends_with_newline:
709 return 'complete', None
712 return 'complete', None
710 return 'incomplete', find_last_indent(lines)
713 return 'incomplete', find_last_indent(lines)
711
714
712 # If there's a blank line at the end, assume we're ready to execute
715 # If there's a blank line at the end, assume we're ready to execute
713 if not lines[-1].strip():
716 if not lines[-1].strip():
714 return 'complete', None
717 return 'complete', None
715
718
716 return 'complete', None
719 return 'complete', None
717
720
718
721
719 def find_last_indent(lines):
722 def find_last_indent(lines):
720 m = _indent_re.match(lines[-1])
723 m = _indent_re.match(lines[-1])
721 if not m:
724 if not m:
722 return 0
725 return 0
723 return len(m.group(0).replace('\t', ' '*4))
726 return len(m.group(0).replace('\t', ' '*4))
General Comments 0
You need to be logged in to leave comments. Login now