upstream/ipython Commit - r25962:36e740d9

"""Input transformer machinery to support IPython special syntax.

This includes the machinery to recognise and transform ``%magic`` commands,
``!system`` commands, ``help?`` querying, prompt stripping, and so forth.

Added: IPython 7.0. Replaces inputsplitter and inputtransformer which were
deprecated in 7.0.
"""

9

10

# Copyright (c) IPython Development Team.

10

# Copyright (c) IPython Development Team.

11

# Distributed under the terms of the Modified BSD License.

11

# Distributed under the terms of the Modified BSD License.

12

13

from codeop import compile_command

13

from codeop import compile_command

14

import re

14

import re

15

import tokenize

15

import tokenize

16

from typing import List, Tuple, Union

16

from typing import List, Tuple, Union

17

import warnings

17

import warnings

18

19

# Matches a non-empty run of spaces and/or tabs at the very start of a string.
_indent_re = re.compile(r'^[ \t]+')

20

21

def leading_empty_lines(lines):
    """Remove leading empty lines.

    Lines at the start of *lines* that are empty or contain only whitespace
    are dropped; everything from the first non-blank line onwards is returned.

    If *lines* is empty, or if every line is blank, the input list is returned
    unchanged.
    """
    for i, line in enumerate(lines):
        if line and not line.isspace():
            return lines[i:]
    # Empty input, or no line with real content: nothing to anchor the cut on.
    return lines

33

34

def leading_indent(lines):
    """Remove leading indentation.

    If the first line starts with spaces or tabs, the same whitespace will be
    removed from each following line in the cell. Lines that do not start with
    exactly that whitespace prefix are left untouched.
    """
    if not lines:
        return lines
    first = lines[0]
    # Length of the leading run of spaces/tabs on the first line.
    n = len(first) - len(first.lstrip(' \t'))
    if n == 0:
        return lines
    space = first[:n]
    return [line[n:] if line.startswith(space) else line
            for line in lines]

49

50

class PromptStripper:
    """Remove matching input prompts from a block of input.

    Parameters
    ----------
    prompt_re : regular expression
        A regular expression matching any input prompt (including continuation,
        e.g. ``...``)
    initial_re : regular expression, optional
        A regular expression matching only the initial prompt, but not continuation.
        If no initial expression is given, prompt_re will be used everywhere.
        Used mainly for plain Python prompts (``>>>``), where the continuation prompt
        ``...`` is a valid Python expression in Python 3, so shouldn't be stripped.

    Notes
    -----
    If initial_re and prompt_re differ,
    only initial_re will be tested against the first line.
    If any prompt is found on the first two lines,
    prompts will be stripped from the rest of the block.
    """
    def __init__(self, prompt_re, initial_re=None):
        self.prompt_re = prompt_re
        # Fall back to the general prompt pattern for the first line too.
        self.initial_re = initial_re or prompt_re

    def _strip(self, lines):
        """Return *lines* with at most one ``prompt_re`` match removed per line."""
        return [self.prompt_re.sub('', line, count=1) for line in lines]

    def __call__(self, lines):
        """Strip prompts from *lines* if the first or second line has one.

        The first line is tested with ``initial_re`` and the second (when
        present) with ``prompt_re``. If neither matches, *lines* is returned
        unchanged.
        """
        if not lines:
            return lines
        first_has_prompt = self.initial_re.match(lines[0])
        second_has_prompt = len(lines) > 1 and self.prompt_re.match(lines[1])
        if first_has_prompt or second_has_prompt:
            return self._strip(lines)
        return lines

83

86

84

# Plain Python prompts. The initial pattern matches only ``>>>`` so that a
# first line consisting of ``...`` is not treated as a prompt.
classic_prompt = PromptStripper(
    prompt_re=re.compile(r'^(>>>|\.\.\.)( |$)'),
    initial_re=re.compile(r'^>>>( |$)')
)

# IPython prompts: ``In [N]: `` and the ``...: `` continuation prompt.
ipython_prompt = PromptStripper(re.compile(r'^(In \[\d+\]: |\s*\.{3,}: ?)'))

90

93

91

def cell_magic(lines):
    """Turn a ``%%magic`` cell into a single ``run_cell_magic`` call line.

    If the first line does not start with ``%%``, or it has the form
    ``%%name?`` (a help request), *lines* is returned unchanged. Otherwise the
    first line is split at its first space into the magic name and the rest of
    that line, the remaining lines are joined into the cell body, and a
    one-element list holding the generated call is returned.
    """
    if not lines or not lines[0].startswith('%%'):
        return lines
    if re.match(r'%%\w+\?', lines[0]):
        # This case will be handled by help_end
        return lines
    magic_name, _, first_line = lines[0][2:].rstrip().partition(' ')
    body = ''.join(lines[1:])
    return ['get_ipython().run_cell_magic(%r, %r, %r)\n'
            % (magic_name, first_line, body)]

101

104

102

105

103

def _find_assign_op(token_line) -> Union[int, None]:

106

def _find_assign_op(token_line) -> Union[int, None]:

104

"""Get the index of the first assignment in the line ('=' not inside brackets)

107

"""Get the index of the first assignment in the line ('=' not inside brackets)

105

108

106

Note: We don't try to support multiple special assignment (a = b = %foo)

109

Note: We don't try to support multiple special assignment (a = b = %foo)

107

"""

110

"""

108

paren_level = 0

111

paren_level = 0

109

for i, ti in enumerate(token_line):

112

for i, ti in enumerate(token_line):

110

s = ti.string

113

s = ti.string

111

if s == '=' and paren_level == 0:

114

if s == '=' and paren_level == 0:

112

return i

115

return i

113

if s in {'(','[','{'}:

116

if s in {'(','[','{'}:

114

paren_level += 1

117

paren_level += 1

115

elif s in {')', ']', '}'}:

118

elif s in {')', ']', '}'}:

116

if paren_level > 0:

119

if paren_level > 0:

117

paren_level -= 1

120

paren_level -= 1

118

121

119

def find_end_of_continued_line(lines, start_line: int):
    """Find the last line of a line explicitly extended using backslashes.

    Starting at *start_line*, follows lines ending in a backslash + newline
    and returns the index of the first line that does not. If the final line
    of *lines* itself ends in a backslash, the index of that final line is
    returned, so the result is always a valid index into *lines*.

    Uses 0-indexed line numbers.
    """
    end_line = start_line
    last_ix = len(lines) - 1
    # Stop at the last line even if it ends with a dangling backslash.
    while lines[end_line].endswith('\\\n') and end_line < last_ix:
        end_line += 1
    return end_line

130

133

131

def assemble_continued_line(lines, start: Tuple[int, int], end_line: int):
    r"""Assemble a single line from multiple continued line pieces

    Continued lines are lines ending in ``\``, and the line following the last
    ``\`` in the block.

    For example, this code continues over multiple lines::

        if (assign_ix is not None) \
             and (len(line) >= assign_ix + 2) \
             and (line[assign_ix+1].string == '%') \
             and (line[assign_ix+2].type == tokenize.NAME):

    This statement contains four continued line pieces.
    Assembling these pieces into a single line would give::

        if (assign_ix is not None) and (len(line) >= assign_ix + 2) and (line[...

    This uses 0-indexed line numbers. *start* is (lineno, colno).

    Used to allow ``%magic`` and ``!system`` commands to be continued over
    multiple lines.
    """
    start_lineno, start_col = start[0], start[1]
    # First piece begins at the start column; later pieces are whole lines.
    parts = [lines[start_lineno][start_col:]] + lines[start_lineno+1:end_line+1]
    # Strip trailing whitespace plus the backslash from all but the last piece.
    continued = [p.rstrip()[:-1] for p in parts[:-1]]
    # The last piece only loses its trailing whitespace/newline.
    return ' '.join(continued + [parts[-1].rstrip()])

157

160

158

class TokenTransformBase:
    """Base class for transformations which examine tokens.

    Special syntax should not be transformed when it occurs inside strings or
    comments. This is hard to reliably avoid with regexes. The solution is to
    tokenise the code as Python, and recognise the special syntax in the tokens.

    IPython's special syntax is not valid Python syntax, so tokenising may go
    wrong after the special syntax starts. These classes therefore find and
    transform *one* instance of special syntax at a time into regular Python
    syntax. After each transformation, tokens are regenerated to find the next
    piece of special syntax.

    Subclasses need to implement one class method (find)
    and one regular method (transform).

    The priority attribute can select which transformation to apply if multiple
    transformers match in the same place. Lower numbers have higher priority.
    This allows "%magic?" to be turned into a help call rather than a magic call.
    """
    # Lower numbers -> higher priority (for matches in the same location)
    priority = 10

    def sortby(self):
        """Return the sort key ``(start_line, start_col, priority)``."""
        return self.start_line, self.start_col, self.priority

    def __init__(self, start):
        """Record the start position of the special syntax.

        *start* is a ``(lineno, colno)`` pair whose line number is 1-indexed;
        it is stored as a 0-indexed ``start_line`` plus ``start_col``.
        """
        self.start_line = start[0] - 1   # Shift from 1-index to 0-index
        self.start_col = start[1]

    @classmethod
    def find(cls, tokens_by_line):
        """Find one instance of special syntax in the provided tokens.

        Tokens are grouped into logical lines for convenience,
        so it is easy to e.g. look at the first token of each line.
        *tokens_by_line* is a list of lists of tokenize.TokenInfo objects.

        This should return an instance of its class, pointing to the start
        position it has found, or None if it found no match.
        """
        raise NotImplementedError

    def transform(self, lines: List[str]):
        """Transform one instance of special syntax found by ``find()``

        Takes a list of strings representing physical lines,
        returns a similar list of transformed lines.
        """
        raise NotImplementedError

208

211

209

class MagicAssign(TokenTransformBase):
    """Transformer for assignments from magics (a = %foo)"""
    @classmethod
    def find(cls, tokens_by_line):
        """Find the first magic assignment (a = %foo) in the cell.

        Returns an instance positioned at the ``%`` token, or None if no
        line has a top-level ``=`` directly followed by ``%`` and a name.
        """
        for line in tokens_by_line:
            assign_ix = _find_assign_op(line)
            # Two tokens after the '=' are inspected, so both must exist.
            if (assign_ix is not None) \
                    and (len(line) > assign_ix + 2) \
                    and (line[assign_ix+1].string == '%') \
                    and (line[assign_ix+2].type == tokenize.NAME):
                return cls(line[assign_ix+1].start)
        return None

    def transform(self, lines: List[str]):
        """Transform a magic assignment found by the ``find()`` classmethod.

        The text from the ``%`` to the end of the (possibly backslash-continued)
        line is replaced by a ``get_ipython().run_line_magic(name, args)`` call;
        the text before the ``%`` and all other lines are kept as they are.
        """
        start_line, start_col = self.start_line, self.start_col
        lhs = lines[start_line][:start_col]
        end_line = find_end_of_continued_line(lines, start_line)
        rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
        assert rhs.startswith('%'), rhs
        magic_name, _, args = rhs[1:].partition(' ')

        lines_before = lines[:start_line]
        call = "get_ipython().run_line_magic({!r}, {!r})".format(magic_name, args)
        new_line = lhs + call + '\n'
        lines_after = lines[end_line+1:]

        return lines_before + [new_line] + lines_after

239

242

240

243

241

class SystemAssign(TokenTransformBase):
    """Transformer for assignments from system commands (a = !foo)"""
    @classmethod
    def find(cls, tokens_by_line):
        """Find the first system assignment (a = !foo) in the cell.

        Returns an instance positioned at the ``!`` token, or None if no
        line matches.
        """
        for line in tokens_by_line:
            assign_ix = _find_assign_op(line)
            # Skip lines whose text itself begins with '=', and require the
            # token after the '=' to be an ERRORTOKEN.
            if (assign_ix is not None) \
                    and not line[assign_ix].line.strip().startswith('=') \
                    and (len(line) >= assign_ix + 2) \
                    and (line[assign_ix + 1].type == tokenize.ERRORTOKEN):
                ix = assign_ix + 1

                # Step over whitespace-only error tokens until a '!' is found;
                # any other error token means this line is not a match.
                while ix < len(line) and line[ix].type == tokenize.ERRORTOKEN:
                    if line[ix].string == '!':
                        return cls(line[ix].start)
                    elif not line[ix].string.isspace():
                        break
                    ix += 1
        return None

    def transform(self, lines: List[str]):
        """Transform a system assignment found by the ``find()`` classmethod.

        The text from the ``!`` to the end of the (possibly backslash-continued)
        line is replaced by a ``get_ipython().getoutput(cmd)`` call; the text
        before the ``!`` and all other lines are kept as they are.
        """
        start_line, start_col = self.start_line, self.start_col

        lhs = lines[start_line][:start_col]
        end_line = find_end_of_continued_line(lines, start_line)
        rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
        assert rhs.startswith('!'), rhs
        cmd = rhs[1:]

        lines_before = lines[:start_line]
        call = "get_ipython().getoutput({!r})".format(cmd)
        new_line = lhs + call + '\n'
        lines_after = lines[end_line + 1:]

        return lines_before + [new_line] + lines_after

279

282

280

# The escape sequences that define the syntax transformations IPython will
# apply to user input.  These can NOT be just changed here: many regular
# expressions and other parts of the code may use their hardcoded values, and
# for all intents and purposes they constitute the 'IPython syntax', so they
# should be considered fixed.

ESC_SHELL  = '!'     # Send line to underlying system shell
ESC_SH_CAP = '!!'    # Send line to system shell and capture output
ESC_HELP   = '?'     # Find information about object
ESC_HELP2  = '??'    # Find extra-detailed information about object
ESC_MAGIC  = '%'     # Call magic function
ESC_MAGIC2 = '%%'    # Call cell-magic function
ESC_QUOTE  = ','     # Split args on whitespace, quote each as string and call
ESC_QUOTE2 = ';'     # Quote all args as a single string, call
ESC_PAREN  = '/'     # Call first argument with rest of line as arguments

ESCAPE_SINGLES = {'!', '?', '%', ',', ';', '/'}
ESCAPE_DOUBLES = {'!!', '??'}  # %% (cell magic) is handled separately

298

301

299

def _make_help_call(target, esc, next_input=None):
    """Prepares a pinfo(2)/psearch call from a target name and the escape
    (i.e. ? or ??)

    The magic used is ``pinfo2`` when *esc* is ``'??'``; otherwise ``psearch``
    when *target* contains ``*``, else ``pinfo``. When *next_input* is given,
    a ``set_next_input`` call for it is placed before the magic call.
    """
    if esc == '??':
        method = 'pinfo2'
    elif '*' in target:
        method = 'psearch'
    else:
        method = 'pinfo'
    magic_call = 'get_ipython().run_line_magic({!r}, {!r})'.format(method, target)
    if next_input is None:
        return magic_call
    return 'get_ipython().set_next_input({!r});'.format(next_input) + magic_call

314

317

315

def _tr_help(content):
    """Translate lines escaped with: ?

    A naked help line should fire the intro help screen (shell.show_usage())
    """
    if not content:
        return 'get_ipython().show_usage()'

    return _make_help_call(content, '?')

324

327

325

def _tr_help2(content):
    """Translate lines escaped with: ??

    A naked help line should fire the intro help screen (shell.show_usage())
    """
    if not content:
        return 'get_ipython().show_usage()'

    return _make_help_call(content, '??')

334

337

335

def _tr_magic(content):
    """Translate lines escaped with a percent sign: %

    *content* is split at its first space into the magic name and its
    argument string.
    """
    name, _, args = content.partition(' ')
    return 'get_ipython().run_line_magic(%r, %r)' % (name, args)

339

342

340

def _tr_quote(content):
    """Translate lines escaped with a comma: ,

    The first word is the callable name; the remaining words are split on
    whitespace and each is passed as a double-quoted string argument.
    """
    name, _, args = content.partition(' ')
    return '%s("%s")' % (name, '", "'.join(args.split()))

344

347

345

def _tr_quote2(content):
    """Translate lines escaped with a semicolon: ;

    The first word is the callable name; everything after the first space
    is passed as one double-quoted string argument.
    """
    name, _, args = content.partition(' ')
    return '%s("%s")' % (name, args)

349

352

350

def _tr_paren(content):
    """Translate lines escaped with a slash: /

    The first word is the callable name; the remaining whitespace-separated
    words become its comma-separated arguments.
    """
    name, _, args = content.partition(' ')
    return '%s(%s)' % (name, ", ".join(args.split()))

354

357

355

# Maps each escape prefix to a callable that takes the text following the
# prefix and returns the replacement Python source.
tr = { ESC_SHELL  : 'get_ipython().system({!r})'.format,
       ESC_SH_CAP : 'get_ipython().getoutput({!r})'.format,
       ESC_HELP   : _tr_help,
       ESC_HELP2  : _tr_help2,
       ESC_MAGIC  : _tr_magic,
       ESC_QUOTE  : _tr_quote,
       ESC_QUOTE2 : _tr_quote2,
       ESC_PAREN  : _tr_paren }

363

366

364

class EscapedCommand(TokenTransformBase):
    """Transformer for escaped commands like %foo, !foo, or /foo"""
    @classmethod
    def find(cls, tokens_by_line):
        """Find the first escaped command (%foo, !foo, etc.) in the cell.

        A line matches when its first token after any INDENT/DEDENT tokens is
        one of ``ESCAPE_SINGLES``. Returns None if no line matches.
        """
        for line in tokens_by_line:
            if not line:
                continue
            ix = 0
            ll = len(line)
            # Skip over indentation bookkeeping tokens at the start of the line.
            while ll > ix and line[ix].type in {tokenize.INDENT, tokenize.DEDENT}:
                ix += 1
            if ix >= ll:
                continue
            if line[ix].string in ESCAPE_SINGLES:
                return cls(line[ix].start)
        return None

    def transform(self, lines):
        """Transform an escaped line found by the ``find()`` classmethod.

        The (possibly backslash-continued) line is replaced by the output of
        the ``tr`` entry for its escape prefix; the text before the escape is
        kept as indentation. If the prefix has no entry in ``tr``, the call
        text is empty.
        """
        start_line, start_col = self.start_line, self.start_col

        indent = lines[start_line][:start_col]
        end_line = find_end_of_continued_line(lines, start_line)
        line = assemble_continued_line(lines, (start_line, start_col), end_line)

        # Prefer a two-character escape (!! or ??) over a single-character one.
        if len(line) > 1 and line[:2] in ESCAPE_DOUBLES:
            escape, content = line[:2], line[2:]
        else:
            escape, content = line[:1], line[1:]

        if escape in tr:
            call = tr[escape](content)
        else:
            call = ''

        lines_before = lines[:start_line]
        new_line = indent + call + '\n'
        lines_after = lines[end_line + 1:]

        return lines_before + [new_line] + lines_after

406

409

407

# Matches a (possibly dotted, possibly %-prefixed) name followed by ? or ??
# at the end of the text. Group 1 is the name, group 3 the question marks.
_help_end_re = re.compile(r"""(%{0,2}
                              (?!\d)[\w*]+            # Variable name
                              (\.(?!\d)[\w*]+)*       # .etc.etc
                              )
                              (\?\??)$                # ? or ??
                              """,
                              re.VERBOSE)

414

417

415

class HelpEnd(TokenTransformBase):
    """Transformer for help syntax: obj? and obj??"""
    # This needs to be higher priority (lower number) than EscapedCommand so
    # that inspecting magics (%foo?) works.
    priority = 5

    def __init__(self, start, q_locn):
        """Record the start of the line and the location of the ``?``.

        Both *start* and *q_locn* are ``(lineno, colno)`` pairs with
        1-indexed line numbers.
        """
        super().__init__(start)
        self.q_line = q_locn[0] - 1  # Shift from 1-indexed to 0-indexed
        self.q_col = q_locn[1]

    @classmethod
    def find(cls, tokens_by_line):
        """Find the first help command (foo?) in the cell.

        Returns None if no line has ``?`` as its last-but-one token.
        """
        for line in tokens_by_line:
            # Last token is NEWLINE; look at last but one
            if len(line) > 2 and line[-2].string == '?':
                # Find the first token that's not INDENT/DEDENT
                ix = 0
                while line[ix].type in {tokenize.INDENT, tokenize.DEDENT}:
                    ix += 1
                return cls(line[ix].start, line[-2].start)
        return None

    def transform(self, lines):
        """Transform a help command found by the ``find()`` classmethod.

        The lines from the start line through the line holding the ``?`` are
        replaced by a single help call line.

        Raises
        ------
        SyntaxError
            If the text does not end in a name followed by ``?`` or ``??``.
        """
        piece = ''.join(lines[self.start_line:self.q_line+1])
        indent, content = piece[:self.start_col], piece[self.start_col:]
        lines_before = lines[:self.start_line]
        lines_after = lines[self.q_line + 1:]

        m = _help_end_re.search(content)
        if not m:
            raise SyntaxError(content)
        target = m.group(1)
        esc = m.group(3)

        # If we're mid-command, put it back on the next prompt for the user.
        next_input = None
        if (not lines_before) and (not lines_after) \
                and content.strip() != m.group(0):
            next_input = content.rstrip('?\n')

        call = _make_help_call(target, esc, next_input=next_input)
        new_line = indent + call + '\n'

        return lines_before + [new_line] + lines_after

464

467

465

def make_tokens_by_line(lines:List[str]):
    """Tokenize a series of lines and group tokens by line.

    The tokens for a multiline Python string or expression are grouped as one
    line. All lines except the last lines should keep their line ending ('\\n',
    '\\r\\n') for this to properly work. Use `.splitlines(keepends=True)`
    for example when passing block of text to this function.

    Returns a list of lists of tokens, one inner list per logical line.  If
    tokenizing stops early with ``tokenize.TokenError``, the tokens produced
    up to that point are returned.
    """
    # NL tokens are used inside multiline expressions, but also after blank
    # lines or comments. This is intentional - see https://bugs.python.org/issue17061
    # We want to group the former case together but split the latter, so we
    # track parentheses level, similar to the internals of tokenize.
    NEWLINE, NL = tokenize.NEWLINE, tokenize.NL
    tokens_by_line = [[]]
    if len(lines) > 1 and not lines[0].endswith(('\n', '\r', '\r\n', '\x0b', '\x0c')):
        warnings.warn(
            "`make_tokens_by_line` received a list of lines which do not have "
            "lineending markers ('\\n', '\\r', '\\r\\n', '\\x0b', '\\x0c'), "
            "behavior will be unspecified")
    parenlev = 0
    try:
        for token in tokenize.generate_tokens(iter(lines).__next__):
            tokens_by_line[-1].append(token)
            if (token.type == NEWLINE) \
                    or ((token.type == NL) and (parenlev <= 0)):
                # End of a logical line: start collecting the next group.
                tokens_by_line.append([])
            elif token.string in {'(', '[', '{'}:
                parenlev += 1
            elif token.string in {')', ']', '}'}:
                # Never go negative on unbalanced closing brackets.
                if parenlev > 0:
                    parenlev -= 1
    except tokenize.TokenError:
        # Input ended in a multiline string or expression. That's OK for us.
        pass

    # Drop the trailing group if nothing was collected into it.
    if not tokens_by_line[-1]:
        tokens_by_line.pop()

    return tokens_by_line

504

507

505

def show_linewise_tokens(s: str):
    """For investigation and debugging

    Print the tokens of source string *s*, grouped by line as
    ``make_tokens_by_line()`` groups them.  A trailing newline is added to
    *s* first if it does not already end with one.
    """
    if not s.endswith('\n'):
        s += '\n'
    lines = s.splitlines(keepends=True)
    for line in make_tokens_by_line(lines):
        print("Line -------")
        for tokinfo in line:
            print(" ", tokinfo)

514

517

515

# Arbitrary limit to prevent getting stuck in infinite loops
TRANSFORM_LOOP_LIMIT = 500

517

520

518

class TransformerManager:
    """Applies various transformations to a cell or code block.

    The key methods for external use are ``transform_cell()``
    and ``check_complete()``.
    """
    def __init__(self):
        # Applied first, in order, to the list of lines of a cell.
        self.cleanup_transforms = [
            leading_empty_lines,
            leading_indent,
            classic_prompt,
            ipython_prompt,
        ]
        # Applied after the cleanup transforms, also to the list of lines.
        self.line_transforms = [
            cell_magic,
        ]
        # Classes whose ``find()`` classmethod locates special syntax in the
        # tokenized lines; see ``do_one_token_transform()``.
        self.token_transformers = [
            MagicAssign,
            SystemAssign,
            EscapedCommand,
            HelpEnd,
        ]

    def do_one_token_transform(self, lines):
        """Find and run the transform earliest in the code.

        Returns (changed, lines).

        This method is called repeatedly until changed is False, indicating
        that all available transformations are complete.

        The tokens following IPython special syntax might not be valid, so
        the transformed code is retokenised every time to identify the next
        piece of special syntax. Hopefully long code cells are mostly valid
        Python, not using lots of IPython special syntax, so this shouldn't be
        a performance issue.
        """
        tokens_by_line = make_tokens_by_line(lines)
        candidates = []
        for transformer_cls in self.token_transformers:
            transformer = transformer_cls.find(tokens_by_line)
            if transformer:
                candidates.append(transformer)

        if not candidates:
            # Nothing to transform
            return False, lines
        ordered_transformers = sorted(candidates, key=TokenTransformBase.sortby)
        for transformer in ordered_transformers:
            try:
                return True, transformer.transform(lines)
            except SyntaxError:
                # This candidate could not be applied; try the next one.
                pass
        return False, lines

    def do_token_transforms(self, lines):
        """Apply token transforms repeatedly until nothing changes.

        Raises RuntimeError if the lines are still changing after
        ``TRANSFORM_LOOP_LIMIT`` iterations.
        """
        for _ in range(TRANSFORM_LOOP_LIMIT):
            changed, lines = self.do_one_token_transform(lines)
            if not changed:
                return lines

        raise RuntimeError("Input transformation still changing after "
                           "%d iterations. Aborting." % TRANSFORM_LOOP_LIMIT)

    def transform_cell(self, cell: str) -> str:
        """Transforms a cell of input code"""
        if not cell.endswith('\n'):
            cell += '\n'  # Ensure the cell has a trailing newline
        lines = cell.splitlines(keepends=True)
        for transform in self.cleanup_transforms + self.line_transforms:
            lines = transform(lines)

        lines = self.do_token_transforms(lines)
        return ''.join(lines)

    def check_complete(self, cell: str):
        """Return whether a block of code is ready to execute, or should be continued

        Parameters
        ----------
        cell : string
          Python input code, which can be multiline.

        Returns
        -------
        status : str
          One of 'complete', 'incomplete', or 'invalid' if source is not a
          prefix of valid code.
        indent_spaces : int or None
          The number of spaces by which to indent the next line of code. If
          status is not 'incomplete', this is None.
        """
        # Remember if the lines ends in a new line.  Trailing whitespace after
        # the last newline is ignored for this check.
        ends_with_newline = False
        for character in reversed(cell):
            if character == '\n':
                ends_with_newline = True
                break
            elif character.strip():
                break

        if not ends_with_newline:
            # Append a newline for consistent tokenization
            # See https://bugs.python.org/issue33899
            cell += '\n'

        lines = cell.splitlines(keepends=True)

        if not lines:
            return 'complete', None

        if lines[-1].endswith('\\'):
            # Explicit backslash continuation
            return 'incomplete', find_last_indent(lines)

        try:
            for transform in self.cleanup_transforms:
                if not getattr(transform, 'has_side_effects', False):
                    lines = transform(lines)
        except SyntaxError:
            return 'invalid', None

        if lines[0].startswith('%%'):
            # Special case for cell magics - completion marked by blank line
            if lines[-1].strip():
                return 'incomplete', find_last_indent(lines)
            else:
                return 'complete', None

        try:
            for transform in self.line_transforms:
                if not getattr(transform, 'has_side_effects', False):
                    lines = transform(lines)
            lines = self.do_token_transforms(lines)
        except SyntaxError:
            return 'invalid', None

        tokens_by_line = make_tokens_by_line(lines)

        if not tokens_by_line:
            return 'incomplete', find_last_indent(lines)

        if tokens_by_line[-1][-1].type != tokenize.ENDMARKER:
            # We're in a multiline string or expression
            return 'incomplete', find_last_indent(lines)

        newline_types = {tokenize.NEWLINE, tokenize.COMMENT, tokenize.ENDMARKER}

        # Pop the last line which only contains DEDENTs and ENDMARKER
        last_token_line = None
        if {t.type for t in tokens_by_line[-1]} in [
            {tokenize.DEDENT, tokenize.ENDMARKER},
            {tokenize.ENDMARKER}
        ] and len(tokens_by_line) > 1:
            last_token_line = tokens_by_line.pop()

        # Strip trailing NEWLINE/COMMENT/ENDMARKER tokens from the last line.
        while tokens_by_line[-1] and tokens_by_line[-1][-1].type in newline_types:
            tokens_by_line[-1].pop()

        if not tokens_by_line[-1]:
            return 'incomplete', find_last_indent(lines)

        if tokens_by_line[-1][-1].string == ':':
            # The last line starts a block (e.g. 'if foo:')
            ix = 0
            while tokens_by_line[-1][ix].type in {tokenize.INDENT, tokenize.DEDENT}:
                ix += 1

            indent = tokens_by_line[-1][ix].start[1]
            return 'incomplete', indent + 4

        if tokens_by_line[-1][0].line.endswith('\\'):
            return 'incomplete', None

        # At this point, our checks think the code is complete (or invalid).
        # We'll use codeop.compile_command to check this with the real parser
        try:
            with warnings.catch_warnings():
                # Turn SyntaxWarning into an exception so it is caught below.
                warnings.simplefilter('error', SyntaxWarning)
                res = compile_command(''.join(lines), symbol='exec')
        except (SyntaxError, OverflowError, ValueError, TypeError,
                MemoryError, SyntaxWarning):
            return 'invalid', None
        else:
            if res is None:
                return 'incomplete', find_last_indent(lines)

        if last_token_line and last_token_line[0].type == tokenize.DEDENT:
            if ends_with_newline:
                return 'complete', None
            return 'incomplete', find_last_indent(lines)

        # Whether or not there is a blank line at the end, every check above
        # has passed, so assume we're ready to execute.
        return 'complete', None

717

720

718

721

719

def find_last_indent(lines):
    """Return the indentation width of the last line in *lines*.

    The leading run of spaces and tabs matched by ``_indent_re`` is measured
    with each tab counted as four spaces.  Returns 0 when the last line has
    no leading whitespace or when *lines* is empty.
    """
    if not lines:
        # Nothing to measure; avoid an IndexError on lines[-1].
        return 0
    m = _indent_re.match(lines[-1])
    if not m:
        return 0
    return len(m.group(0).replace('\t', ' '*4))

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             """Input transformer machinery to support IPython special syntax.
             This includes the machinery to recognise and transform ``%magic`` commands,
             ``!system`` commands, ``help?`` querying, prompt stripping, and so forth.
             Added: IPython 7.0. Replaces inputsplitter and inputtransformer which were
             deprecated in 7.0.
             """
             # Copyright (c) IPython Development Team.
             # Distributed under the terms of the Modified BSD License.
             from codeop import compile_command
             import re
             import tokenize
             from typing import List, Tuple, Union
             import warnings
             _indent_re = re.compile(r'^[ \t]+')
             def leading_empty_lines(lines):
                 """Drop blank lines from the start of a cell.

                 Lines that are empty or whitespace-only are skipped until the first
                 line with real content; everything from that line onwards is returned.
                 If no line has content (or *lines* is empty), the input list is
                 returned unchanged.
                 """
                 first_content = next(
                     (ix for ix, text in enumerate(lines) if text and not text.isspace()),
                     None,
                 )
                 if first_content is None:
                     return lines
                 return lines[first_content:]
             def leading_indent(lines):
                 """Strip the first line's leading whitespace from the whole cell.

                 If the first line starts with spaces or tabs, that exact run of
                 whitespace is removed from every line which begins with it. Lines
                 that do not start with the same whitespace are left untouched.
                 """
                 if not lines:
                     return lines
                 found = _indent_re.match(lines[0])
                 if found is None:
                     return lines
                 prefix = found.group(0)
                 width = len(prefix)
                 dedented = []
                 for text in lines:
                     dedented.append(text[width:] if text.startswith(prefix) else text)
                 return dedented
             class PromptStripper:
                 """Callable that strips input prompts from a block of lines.

                 Parameters
                 ----------
                 prompt_re : regular expression
                     Compiled pattern matching any input prompt, including continuation
                     prompts (e.g. ``...``).
                 initial_re : regular expression, optional
                     Compiled pattern matching only the initial prompt, not the
                     continuation. When omitted, prompt_re is used for the first line
                     too. Mainly useful for plain Python prompts (``>>>``), where the
                     continuation prompt ``...`` is itself a valid Python 3 expression
                     and so should not be stripped on its own.

                 Notes
                 -----
                 Only initial_re is tested against the first line and only prompt_re
                 against the second. If either matches, one prompt is removed from
                 every line of the block that has one.
                 """
                 def __init__(self, prompt_re, initial_re=None):
                     self.prompt_re = prompt_re
                     self.initial_re = initial_re if initial_re else prompt_re

                 def _strip(self, lines):
                     # Remove at most one prompt per line.
                     stripped = []
                     for text in lines:
                         stripped.append(self.prompt_re.sub('', text, count=1))
                     return stripped

                 def __call__(self, lines):
                     if not lines:
                         return lines
                     if not self.initial_re.match(lines[0]):
                         # The first line has no initial prompt; fall back to looking
                         # for any prompt on the second line.
                         if len(lines) <= 1 or not self.prompt_re.match(lines[1]):
                             return lines
                     return self._strip(lines)
             # Strips classic Python REPL prompts: '>>>' and the '...' continuation,
             # each followed by a space or the end of the line. initial_re accepts
             # only '>>>', so a first line starting with '...' does not by itself
             # trigger stripping.
             classic_prompt = PromptStripper(
                 prompt_re=re.compile(r'^(>>>|\.\.\.)( |$)'),
                 initial_re=re.compile(r'^>>>( |$)')
             )
             # Strips IPython prompts: 'In [N]: ' and dotted continuation prompts
             # (optional leading whitespace, three or more dots, ':' and an optional
             # space). The same pattern is used for the first line and the rest.
             ipython_prompt = PromptStripper(re.compile(r'^(In \[\d+\]: |\s*\.{3,}: ?)'))
             def cell_magic(lines):
                 """Rewrite a ``%%magic`` cell as a single ``run_cell_magic`` call.

                 Cells that are empty, do not start with ``%%``, or whose first line
                 looks like ``%%name?`` are returned unchanged. Otherwise the result
                 is a one-element list holding the call; the first line supplies the
                 magic name and its argument string, the remaining lines the body.
                 """
                 if not lines:
                     return lines
                 header = lines[0]
                 if not header.startswith('%%'):
                     return lines
                 if re.match(r'%%\w+\?', header):
                     # This case will be handled by help_end
                     return lines
                 magic_name, _, first_line = header[2:].rstrip().partition(' ')
                 body = ''.join(lines[1:])
                 call = ('get_ipython().run_cell_magic(%r, %r, %r)\n'
                         % (magic_name, first_line, body))
                 return [call]
             def _find_assign_op(token_line) -> Union[int, None]:
                 """Get the index of the first assignment in the line ('=' not inside brackets)
                 Note: We don't try to support multiple special assignment (a = b = %foo)
                 """
                 paren_level = 0
                 for i, ti in enumerate(token_line):
                     s = ti.string
                     if s == '=' and paren_level == 0:
                         return i
                     if s in {'(','[','{'}:
                         paren_level += 1
                     elif s in {')', ']', '}'}:
                         if paren_level > 0:
                             paren_level -= 1
             def find_end_of_continued_line(lines, start_line: int):
                 """Locate the end of a backslash-continued line starting at *start_line*.

                 Line numbers are 0-indexed. The result is the index of the first line
                 at or after *start_line* that does not end in a backslash followed by
                 a newline. If every line up to the end of *lines* is continued, the
                 result is ``len(lines)``.
                 """
                 total = len(lines)
                 end_line = start_line
                 while True:
                     if not lines[end_line].endswith('\\\n'):
                         return end_line
                     end_line += 1
                     if end_line >= total:
                         return end_line
             def assemble_continued_line(lines, start: Tuple[int, int], end_line: int):
                 r"""Join the pieces of a backslash-continued line into one string.

                 A continued line is made of the lines ending in ``\`` plus the line
                 following the last ``\``. For example, this statement is spread over
                 four pieces::

                     if (assign_ix is not None) \
                          and (len(line) >= assign_ix + 2) \
                          and (line[assign_ix+1].string == '%') \
                          and (line[assign_ix+2].type == tokenize.NAME):

                 and assembling it gives::

                     if (assign_ix is not None) and (len(line) >= assign_ix + 2) and (line[...

                 Line numbers are 0-indexed. *start* is (lineno, colno): text before
                 colno on the first line is dropped. *end_line* is the index of the
                 last piece. The pieces are joined with single spaces.

                 Used to allow ``%magic`` and ``!system`` commands to be continued over
                 multiple lines.
                 """
                 first_lineno = start[0]
                 first_col = start[1]
                 pieces = [lines[first_lineno][first_col:]]
                 pieces.extend(lines[first_lineno + 1:end_line + 1])
                 *continued, final = pieces
                 # Every piece but the last loses its trailing backslash+newline.
                 cleaned = [piece.rstrip()[:-1] for piece in continued]
                 # The last piece only loses its trailing whitespace/newline.
                 cleaned.append(final.rstrip())
                 return ' '.join(cleaned)
             class TokenTransformBase:
                 """Base class for transformations which examine tokens.

                 Special syntax must be left alone when it appears inside strings or
                 comments, which is hard to guarantee with regexes. Instead the code is
                 tokenised as Python and the special syntax is recognised in the tokens.

                 Because IPython's special syntax is not valid Python, tokenising may go
                 wrong after the point where it starts. Subclasses therefore find and
                 transform *one* instance of special syntax at a time; tokens are
                 regenerated after each transformation to locate the next one.

                 Subclasses need to implement one class method (find)
                 and one regular method (transform).

                 The priority attribute decides which transformation wins when several
                 match at the same place. Lower numbers have higher priority, which is
                 what lets "%magic?" become a help call rather than a magic call.
                 """
                 # Lower numbers -> higher priority (for matches in the same location)
                 priority = 10

                 def __init__(self, start):
                     row, col = start[0], start[1]
                     self.start_line = row - 1   # Shift from 1-index to 0-index
                     self.start_col = col

                 def sortby(self):
                     """Sort key: earliest position first, then priority."""
                     return (self.start_line, self.start_col, self.priority)

                 @classmethod
                 def find(cls, tokens_by_line):
                     """Find one instance of special syntax in the provided tokens.

                     *tokens_by_line* is a list of lists of tokenize.TokenInfo objects,
                     grouped into logical lines so that it is easy to e.g. look at the
                     first token of each line.

                     Implementations return an instance of their class pointing at the
                     start position found, or None if nothing matched.
                     """
                     raise NotImplementedError

                 def transform(self, lines: List[str]):
                     """Transform one instance of special syntax found by ``find()``

                     Takes a list of strings representing physical lines and returns a
                     similar list of transformed lines.
                     """
                     raise NotImplementedError
             class MagicAssign(TokenTransformBase):
                 """Transformer for assignments from magics (a = %foo)"""
                 @classmethod
                 def find(cls, tokens_by_line):
                     """Find the first magic assignment (a = %foo) in the cell.

                     Returns an instance pointing at the ``%`` token, or None if no
                     line has a top-level ``=`` directly followed by ``%`` and a name.
                     """
                     for line in tokens_by_line:
                         assign_ix = _find_assign_op(line)
                         # Two tokens after the '=' are inspected (the '%' and the
                         # magic name), so index assign_ix + 2 must exist. A token
                         # line cut short by a tokenize error can end right after '%'.
                         if (assign_ix is not None) \
                                 and (len(line) > assign_ix + 2) \
                                 and (line[assign_ix+1].string == '%') \
                                 and (line[assign_ix+2].type == tokenize.NAME):
                             return cls(line[assign_ix+1].start)
                     return None

                 def transform(self, lines: List[str]):
                     """Transform a magic assignment found by the ``find()`` classmethod.

                     The text from the ``%`` to the end of the (possibly
                     backslash-continued) line is replaced by a ``run_line_magic`` call;
                     the text before it on the same line is kept. Returns the new list
                     of lines, with the continued lines collapsed into one.
                     """
                     start_line, start_col = self.start_line, self.start_col
                     lhs = lines[start_line][:start_col]
                     end_line = find_end_of_continued_line(lines, start_line)
                     rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
                     assert rhs.startswith('%'), rhs
                     # First word after the '%' is the magic name, the rest its arguments.
                     magic_name, _, args = rhs[1:].partition(' ')
                     lines_before = lines[:start_line]
                     call = "get_ipython().run_line_magic({!r}, {!r})".format(magic_name, args)
                     new_line = lhs + call + '\n'
                     lines_after = lines[end_line+1:]
                     return lines_before + [new_line] + lines_after
             class SystemAssign(TokenTransformBase):
                 """Transformer for assignments from system commands (a = !foo)"""
                 @classmethod
                 def find(cls, tokens_by_line):
                     """Find the first system assignment (a = !foo) in the cell.

                     Returns an instance pointing at the ``!`` token, or None when no
                     line qualifies. A line qualifies when its top-level ``=`` is
                     followed by error tokens of which the first non-whitespace one
                     is ``!``. Lines whose text starts with ``=`` are ignored.
                     """
                     for line in tokens_by_line:
                         assign_ix = _find_assign_op(line)
                         if assign_ix is None:
                             continue
                         if line[assign_ix].line.strip().startswith('='):
                             continue
                         if len(line) < assign_ix + 2:
                             continue
                         if line[assign_ix + 1].type != tokenize.ERRORTOKEN:
                             continue
                         # Walk the run of error tokens that follows the '='.
                         for tok in line[assign_ix + 1:]:
                             if tok.type != tokenize.ERRORTOKEN:
                                 break
                             if tok.string == '!':
                                 return cls(tok.start)
                             if not tok.string.isspace():
                                 break
                     return None

                 def transform(self, lines: List[str]):
                     """Transform a system assignment found by the ``find()`` classmethod.

                     The text from the ``!`` to the end of the (possibly
                     backslash-continued) line becomes the argument of a ``getoutput``
                     call; the text before it on the same line is kept.
                     """
                     row, col = self.start_line, self.start_col
                     last_row = find_end_of_continued_line(lines, row)
                     command_text = assemble_continued_line(lines, (row, col), last_row)
                     assert command_text.startswith('!'), command_text
                     replacement = (
                         lines[row][:col]
                         + "get_ipython().getoutput({!r})".format(command_text[1:])
                         + '\n'
                     )
                     return lines[:row] + [replacement] + lines[last_row + 1:]
             # The escape sequences that define the syntax transformations IPython will
             # apply to user input.  These can NOT be just changed here: many regular
             # expressions and other parts of the code may use their hardcoded values, and
             # for all intents and purposes they constitute the 'IPython syntax', so they
             # should be considered fixed.
             ESC_SHELL  = '!'     # Send line to underlying system shell
             ESC_SH_CAP = '!!'    # Send line to system shell and capture output
             ESC_HELP   = '?'     # Find information about object
             ESC_HELP2  = '??'    # Find extra-detailed information about object
             ESC_MAGIC  = '%'     # Call magic function
             ESC_MAGIC2 = '%%'    # Call cell-magic function
             ESC_QUOTE  = ','     # Split args on whitespace, quote each as string and call
             ESC_QUOTE2 = ';'     # Quote all args as a single string, call
             ESC_PAREN  = '/'     # Call first argument with rest of line as arguments
             # The set of all single-character escapes defined above.
             ESCAPE_SINGLES = {'!', '?', '%', ',', ';', '/'}
             # The doubled escapes that are recognised as a two-character prefix.
             ESCAPE_DOUBLES = {'!!', '??'}  # %% (cell magic) is handled separately
             def _make_help_call(target, esc, next_input=None):
                 """Prepares a pinfo(2)/psearch call from a target name and the escape
                 (i.e. ? or ??)"""
                 method  = 'pinfo2' if esc == '??' \
                             else 'psearch' if '*' in target \
                             else 'pinfo'
                 arg = " ".join([method, target])
                 #Prepare arguments for get_ipython().run_line_magic(magic_name, magic_args)
                 t_magic_name, _, t_magic_arg_s = arg.partition(' ')
                 t_magic_name = t_magic_name.lstrip(ESC_MAGIC)
                 if next_input is None:
                     return 'get_ipython().run_line_magic(%r, %r)' % (t_magic_name, t_magic_arg_s)
                 else:
                     return 'get_ipython().set_next_input(%r);get_ipython().run_line_magic(%r, %r)' % \
                        (next_input, t_magic_name, t_magic_arg_s)
             def _tr_help(content):
                 """Translate lines escaped with: ?

                 With no content (a naked ``?``) the result is a call to
                 shell.show_usage(), the intro help screen. Otherwise it is the
                 help call for *content*.
                 """
                 if content:
                     return _make_help_call(content, '?')
                 return 'get_ipython().show_usage()'
             def _tr_help2(content):
                 """Translate lines escaped with: ??

                 With no content (a naked ``??``) the result is a call to
                 shell.show_usage(), the intro help screen. Otherwise it is the
                 detailed help call for *content*.
                 """
                 if content:
                     return _make_help_call(content, '??')
                 return 'get_ipython().show_usage()'
             def _tr_magic(content):
                 "Translate lines escaped with a percent sign: %"
                 name, _, args = content.partition(' ')
                 return 'get_ipython().run_line_magic(%r, %r)' % (name, args)
             def _tr_quote(content):
                 "Translate lines escaped with a comma: ,"
                 name, _, args = content.partition(' ')
                 return '%s("%s")' % (name, '", "'.join(args.split()) )
             def _tr_quote2(content):
                 "Translate lines escaped with a semicolon: ;"
                 name, _, args = content.partition(' ')
                 return '%s("%s")' % (name, args)
             def _tr_paren(content):
                 "Translate lines escaped with a slash: /"
                 name, _, args = content.partition(' ')
                 return '%s(%s)' % (name, ", ".join(args.split()))
             # Dispatch table: maps an escape string to a callable which takes the text
             # following the escape and returns the replacement Python source.
             # ESC_MAGIC2 ('%%') has no entry here.
             tr = { ESC_SHELL  : 'get_ipython().system({!r})'.format,
                    ESC_SH_CAP : 'get_ipython().getoutput({!r})'.format,
                    ESC_HELP   : _tr_help,
                    ESC_HELP2  : _tr_help2,
                    ESC_MAGIC  : _tr_magic,
                    ESC_QUOTE  : _tr_quote,
                    ESC_QUOTE2 : _tr_quote2,
                    ESC_PAREN  : _tr_paren }
             class EscapedCommand(TokenTransformBase):
                 """Transformer for escaped commands like %foo, !foo, or /foo"""
                 @classmethod
                 def find(cls, tokens_by_line):
                     """Find the first escaped command (%foo, !foo, etc.) in the cell.

                     A line matches when its first token, ignoring INDENT/DEDENT
                     tokens, is one of the single-character escapes. Returns an
                     instance pointing at that token, or None.
                     """
                     layout_types = {tokenize.INDENT, tokenize.DEDENT}
                     for line in tokens_by_line:
                         first = next(
                             (tok for tok in line if tok.type not in layout_types),
                             None,
                         )
                         if first is not None and first.string in ESCAPE_SINGLES:
                             return cls(first.start)
                     return None

                 def transform(self, lines):
                     """Transform an escaped line found by the ``find()`` classmethod.

                     The escaped command, including any backslash-continued lines, is
                     replaced by one line holding the original indentation and the
                     translated call. An escape with no translator yields an empty
                     call.
                     """
                     row, col = self.start_line, self.start_col
                     last_row = find_end_of_continued_line(lines, row)
                     command = assemble_continued_line(lines, (row, col), last_row)
                     # Prefer a two-character escape ('!!', '??') over a single one.
                     width = 2 if (len(command) > 1 and command[:2] in ESCAPE_DOUBLES) else 1
                     escape, content = command[:width], command[width:]
                     call = tr[escape](content) if escape in tr else ''
                     replacement = lines[row][:col] + call + '\n'
                     return lines[:row] + [replacement] + lines[last_row + 1:]
             # Matches a help request at the end of the text: an optional '%' or '%%'
             # prefix and a dotted name (segments may contain '*' but may not start
             # with a digit), followed by '?' or '??'.
             # Group 1 is the target including any '%' prefix; group 3 is the '?'/'??'.
             _help_end_re = re.compile(r"""(%{0,2}
                                           (?!\d)[\w*]+            # Variable name
                                           (\.(?!\d)[\w*]+)*       # .etc.etc
                                           )
                                           (\?\??)$                # ? or ??
                                           """,
                                           re.VERBOSE)
             class HelpEnd(TokenTransformBase):
                 """Transformer for help syntax: obj? and obj??"""
                 # This needs to be higher priority (lower number) than EscapedCommand so
                 # that inspecting magics (%foo?) works.
                 priority = 5

                 def __init__(self, start, q_locn):
                     """Record the start of the line and the location of the ``?``.

                     Both *start* and *q_locn* are (row, col) pairs with 1-indexed
                     rows; the rows are stored 0-indexed.
                     """
                     super().__init__(start)
                     self.q_line = q_locn[0] - 1  # Shift from 1-indexed to 0-indexed
                     self.q_col = q_locn[1]

                 @classmethod
                 def find(cls, tokens_by_line):
                     """Find the first help command (foo?) in the cell.

                     Returns an instance for the first logical line whose last token
                     before the final one is ``?``, or None if there is none.
                     """
                     for line in tokens_by_line:
                         # Last token is NEWLINE; look at last but one
                         if len(line) > 2 and line[-2].string == '?':
                             # Find the first token that's not INDENT/DEDENT
                             ix = 0
                             while line[ix].type in {tokenize.INDENT, tokenize.DEDENT}:
                                 ix += 1
                             return cls(line[ix].start, line[-2].start)
                     return None

                 def transform(self, lines):
                     """Transform a help command found by the ``find()`` classmethod.

                     Raises
                     ------
                     SyntaxError
                         If the text ending in ``?`` does not end with an inspectable
                         name followed by ``?`` or ``??``.
                     """
                     piece = ''.join(lines[self.start_line:self.q_line+1])
                     indent, content = piece[:self.start_col], piece[self.start_col:]
                     lines_before = lines[:self.start_line]
                     lines_after = lines[self.q_line + 1:]
                     m = _help_end_re.search(content)
                     if not m:
                         raise SyntaxError(content)
                     target = m.group(1)
                     esc = m.group(3)
                     # If we're mid-command, put it back on the next prompt for the user.
                     next_input = None
                     if (not lines_before) and (not lines_after) \
                             and content.strip() != m.group(0):
                         next_input = content.rstrip('?\n')
                     call = _make_help_call(target, esc, next_input=next_input)
                     new_line = indent + call + '\n'
                     return lines_before + [new_line] + lines_after
             def make_tokens_by_line(lines:List[str]):
                 """Tokenize a series of lines and group the tokens by logical line.

                 The tokens of a multiline Python string or bracketed expression end up
                 in a single group. Every line except the last should keep its line
                 ending ('\\n', '\\r\\n') for this to work properly; for example, split
                 a block of text with ``.splitlines(keepends=True)`` before passing it
                 in.

                 If the input ends inside a multiline string or expression, the tokens
                 produced up to that point are returned.
                 """
                 # NL tokens are used inside multiline expressions, but also after blank
                 # lines or comments. This is intentional - see https://bugs.python.org/issue17061
                 # We want to group the former case together but split the latter, so we
                 # track the bracket nesting depth, similar to the internals of tokenize.
                 NEWLINE, NL = tokenize.NEWLINE, tokenize.NL
                 openers = {'(', '[', '{'}
                 closers = {')', ']', '}'}
                 if len(lines) > 1 and not lines[0].endswith(('\n', '\r', '\r\n', '\x0b', '\x0c')):
                     warnings.warn("`make_tokens_by_line` received a list of lines which do not have lineending markers ('\\n', '\\r', '\\r\\n', '\\x0b', '\\x0c'), behavior will be unspecified")
                 grouped = [[]]
                 depth = 0
                 try:
                     for tok in tokenize.generate_tokens(iter(lines).__next__):
                         grouped[-1].append(tok)
                         ends_logical_line = (tok.type == NEWLINE) \
                             or ((tok.type == NL) and (depth <= 0))
                         if ends_logical_line:
                             grouped.append([])
                         elif tok.string in openers:
                             depth += 1
                         elif tok.string in closers and depth > 0:
                             depth -= 1
                 except tokenize.TokenError:
                     # Input ended in a multiline string or expression. That's OK for us.
                     pass
                 # Drop the empty group opened after the final line break, if any.
                 if not grouped[-1]:
                     grouped.pop()
                 return grouped
             def show_linewise_tokens(s: str):
                 """For investigation and debugging

                 Prints the tokens of *s*, grouped by logical line, with a header
                 before each group. A trailing newline is added to *s* if missing.
                 """
                 text = s if s.endswith('\n') else s + '\n'
                 for token_line in make_tokens_by_line(text.splitlines(keepends=True)):
                     print("Line -------")
                     for tok in token_line:
                         print(" ", tok)
             # Arbitrary limit to prevent getting stuck in infinite loops.
             # TransformerManager.do_token_transforms raises RuntimeError if the input
             # is still changing after this many single-transform passes.
             TRANSFORM_LOOP_LIMIT = 500
             class TransformerManager:
                 """Applies various transformations to a cell or code block.
                 The key methods for external use are ``transform_cell()``
                 and ``check_complete()``.
                 """
                 def __init__(self):
                     """Set up the default transformation pipeline.

                     Three lists are created; each one is applied in list order.
                     """
                     # Callables taking and returning a list of lines; run first.
                     cleanup = [leading_empty_lines, leading_indent]
                     cleanup += [classic_prompt, ipython_prompt]
                     self.cleanup_transforms = cleanup
                     # Callables taking and returning a list of lines; run second.
                     self.line_transforms = [cell_magic]
                     # Token-based transformer classes, applied one match at a time.
                     self.token_transformers = [
                         MagicAssign, SystemAssign, EscapedCommand, HelpEnd,
                     ]
                 def do_one_token_transform(self, lines):
                     """Find and run the transform earliest in the code.

                     Returns (changed, lines).

                     This method is called repeatedly until changed is False, meaning
                     that all available transformations have been applied.

                     The tokens following IPython special syntax might not be valid, so
                     the code is retokenised on every call to locate the next piece of
                     special syntax. Hopefully long code cells are mostly valid Python,
                     not using lots of IPython special syntax, so this shouldn't be a
                     performance issue.
                     """
                     tokens_by_line = make_tokens_by_line(lines)
                     found = (cls.find(tokens_by_line) for cls in self.token_transformers)
                     matches = [match for match in found if match]
                     if not matches:
                         # Nothing to transform
                         return False, lines
                     for candidate in sorted(matches, key=TokenTransformBase.sortby):
                         try:
                             transformed = candidate.transform(lines)
                         except SyntaxError:
                             # This transformer rejected its match; try the next one.
                             continue
                         return True, transformed
                     return False, lines
                 def do_token_transforms(self, lines):
                     """Apply token transformations until the code stops changing.

                     Returns the transformed lines. Raises RuntimeError if the code is
                     still changing after TRANSFORM_LOOP_LIMIT passes.
                     """
                     passes_left = TRANSFORM_LOOP_LIMIT
                     while passes_left > 0:
                         changed, lines = self.do_one_token_transform(lines)
                         if not changed:
                             return lines
                         passes_left -= 1
                     raise RuntimeError("Input transformation still changing after "
                                        "%d iterations. Aborting." % TRANSFORM_LOOP_LIMIT)
                 def transform_cell(self, cell: str) -> str:
                     """Transforms a cell of input code

                     The cell is split into lines, passed through the cleanup and line
                     transforms in order, then through the token transforms, and joined
                     back into a single string.
                     """
                     # Ensure the cell has a trailing newline
                     source = cell if cell.endswith('\n') else cell + '\n'
                     lines = source.splitlines(keepends=True)
                     for step in self.cleanup_transforms + self.line_transforms:
                         lines = step(lines)
                     return ''.join(self.do_token_transforms(lines))
                 def check_complete(self, cell: str):
                     """Return whether a block of code is ready to execute, or should be continued
                     Parameters
                     ----------
                     source : string
                       Python input code, which can be multiline.
                     Returns
                     -------
                     status : str
                       One of 'complete', 'incomplete', or 'invalid' if source is not a
                       prefix of valid code.
                     indent_spaces : int or None
                       The number of spaces by which to indent the next line of code. If
                       status is not 'incomplete', this is None.
                     """
                     # Remember if the lines ends in a new line.
                     ends_with_newline = False
                     for character in reversed(cell):
                         if character == '\n':
                             ends_with_newline = True
                             break
                         elif character.strip():
                             break
                         else:
                             continue
                     if not ends_with_newline:
                         # Append an newline for consistent tokenization
                         # See https://bugs.python.org/issue33899
                         cell += '\n'
                     lines = cell.splitlines(keepends=True)
                     if not lines:
                         return 'complete', None
                     if lines[-1].endswith('\\'):
                         # Explicit backslash continuation
                         return 'incomplete', find_last_indent(lines)
                     try:
                         for transform in self.cleanup_transforms:
                             if not getattr(transform, 'has_side_effects', False):
                                 lines = transform(lines)
                     except SyntaxError:
                         return 'invalid', None
                     if lines[0].startswith('%%'):
                         # Special case for cell magics - completion marked by blank line
                         if lines[-1].strip():
                             return 'incomplete', find_last_indent(lines)
                         else:
                             return 'complete', None
                     try:
                         for transform in self.line_transforms:
                             if not getattr(transform, 'has_side_effects', False):
                                 lines = transform(lines)
                         lines = self.do_token_transforms(lines)
                     except SyntaxError:
                         return 'invalid', None
                     tokens_by_line = make_tokens_by_line(lines)
                     if not tokens_by_line:
                         return 'incomplete', find_last_indent(lines)
                     if tokens_by_line[-1][-1].type != tokenize.ENDMARKER:
                         # We're in a multiline string or expression
                         return 'incomplete', find_last_indent(lines)
                     newline_types = {tokenize.NEWLINE, tokenize.COMMENT, tokenize.ENDMARKER}
                     # Pop the last line which only contains DEDENTs and ENDMARKER
                     last_token_line = None
                     if {t.type for t in tokens_by_line[-1]} in [
                         {tokenize.DEDENT, tokenize.ENDMARKER},
                         {tokenize.ENDMARKER}
                     ] and len(tokens_by_line) > 1:
                         last_token_line = tokens_by_line.pop()
                     while tokens_by_line[-1] and tokens_by_line[-1][-1].type in newline_types:
                         tokens_by_line[-1].pop()
                     if not tokens_by_line[-1]:
                         return 'incomplete', find_last_indent(lines)
                     if tokens_by_line[-1][-1].string == ':':
                         # The last line starts a block (e.g. 'if foo:')
                         ix = 0
                         while tokens_by_line[-1][ix].type in {tokenize.INDENT, tokenize.DEDENT}:
                             ix += 1
                         indent = tokens_by_line[-1][ix].start[1]
                         return 'incomplete', indent + 4
                     if tokens_by_line[-1][0].line.endswith('\\'):
                         return 'incomplete', None
                     # At this point, our checks think the code is complete (or invalid).
                     # We'll use codeop.compile_command to check this with the real parser
                     try:
                         with warnings.catch_warnings():
                             warnings.simplefilter('error', SyntaxWarning)
                             res = compile_command(''.join(lines), symbol='exec')
                     except (SyntaxError, OverflowError, ValueError, TypeError,
                             MemoryError, SyntaxWarning):
                         return 'invalid', None
                     else:
                         if res is None:
                             return 'incomplete', find_last_indent(lines)
                     if last_token_line and last_token_line[0].type == tokenize.DEDENT:
                         if ends_with_newline:
                             return 'complete', None
                         return 'incomplete', find_last_indent(lines)
                     # If there's a blank line at the end, assume we're ready to execute
                     if not lines[-1].strip():
                         return 'complete', None
                     return 'complete', None
             def find_last_indent(lines):
                 """Return the indentation width of the last line in ``lines``.

                 Only leading spaces and tabs count as indentation, and each tab is
                 counted as four columns.

                 Parameters
                 ----------
                 lines : list of str
                     Source lines; only the final entry is inspected.

                 Returns
                 -------
                 int
                     Width of the last line's leading whitespace, or 0 when that
                     line has none or when ``lines`` is empty.
                 """
                 if not lines:
                     # Nothing to measure; indexing lines[-1] would raise IndexError.
                     return 0
                 last_line = lines[-1]
                 # Slice off the leading run of spaces/tabs (the same character set
                 # as the pattern r'^[ \t]+').
                 stripped = last_line.lstrip(' \t')
                 indent = last_line[:len(last_line) - len(stripped)]
                 return len(indent.replace('\t', ' ' * 4))