upstream/ipython Commit - r25960:e869c779

"""Input transformer machinery to support IPython special syntax.

This includes the machinery to recognise and transform ``%magic`` commands,
``!system`` commands, ``help?`` querying, prompt stripping, and so forth.

Added: IPython 7.0. Replaces inputsplitter and inputtransformer which were
deprecated in 7.0.
"""

9

10

# Copyright (c) IPython Development Team.
# Distributed under the terms of the Modified BSD License.

12

13

from codeop import compile_command

13

from codeop import compile_command

14

import re

14

import re

15

import tokenize

15

import tokenize

16

from typing import List, Tuple, Optional, Any

16

from typing import List, Tuple, Optional, Any

17

import warnings

17

import warnings

18

19

# Matches the run of spaces and/or tabs at the very start of a line.
_indent_re = re.compile(r'^[ \t]+')

20

21

def leading_empty_lines(lines):
    """Remove leading empty lines

    If the leading lines are empty or contain only whitespace, they will be
    removed.

    Parameters
    ----------
    lines : list of str
        The lines of the cell.

    Returns
    -------
    list of str
        *lines* from its first non-blank line onwards. The input is returned
        unchanged when it is empty or when every line is blank.
    """
    if not lines:
        return lines
    for i, line in enumerate(lines):
        if line and not line.isspace():
            return lines[i:]
    # Every line was blank: hand the cell back untouched.
    return lines

33

34

def leading_indent(lines):
    """Remove leading indentation.

    If the first line starts with spaces or tabs, the same whitespace will be
    removed from each following line in the cell.

    Parameters
    ----------
    lines : list of str
        The lines of the cell.

    Returns
    -------
    list of str
        The dedented lines. Lines that do not start with exactly the first
        line's leading whitespace are passed through unchanged. The input is
        returned as-is when it is empty or its first line is not indented.
    """
    if not lines:
        return lines
    m = _indent_re.match(lines[0])
    if not m:
        return lines
    space = m.group(0)
    n = len(space)
    return [l[n:] if l.startswith(space) else l
            for l in lines]

49

50

class PromptStripper:
    """Remove matching input prompts from a block of input.

    Parameters
    ----------
    prompt_re : regular expression
        A regular expression matching any input prompt (including continuation,
        e.g. ``...``)
    initial_re : regular expression, optional
        A regular expression matching only the initial prompt, but not continuation.
        If no initial expression is given, prompt_re will be used everywhere.
        Used mainly for plain Python prompts (``>>>``), where the continuation prompt
        ``...`` is a valid Python expression in Python 3, so shouldn't be stripped.

    Notes
    -----
    If initial_re and prompt_re differ,
    only initial_re will be tested against the first line.
    If any prompt is found on the first two lines,
    prompts will be stripped from the rest of the block.
    """
    def __init__(self, prompt_re, initial_re=None):
        self.prompt_re = prompt_re
        # Fall back to the general prompt pattern for the first line too.
        self.initial_re = initial_re or prompt_re

    def _strip(self, lines):
        """Return *lines* with at most one prompt match removed from each."""
        return [self.prompt_re.sub('', l, count=1) for l in lines]

    def __call__(self, lines):
        """Strip prompts from *lines* if the first two lines look prompted.

        Returns the input unchanged when it is empty or when neither the
        first line (tested with ``initial_re``) nor the second line (tested
        with ``prompt_re``) starts with a prompt.
        """
        if not lines:
            return lines
        if self.initial_re.match(lines[0]) or \
                (len(lines) > 1 and self.prompt_re.match(lines[1])):
            return self._strip(lines)
        return lines

83

86

84

# Strips plain Python prompts. Only ``>>>`` is accepted on the first line,
# because a leading ``...`` is itself a valid Python expression.
classic_prompt = PromptStripper(
    prompt_re=re.compile(r'^(>>>|\.\.\.)( |$)'),
    initial_re=re.compile(r'^>>>( |$)')
)

# Strips IPython prompts: ``In [N]: `` and the ``...: `` continuation prompt.
ipython_prompt = PromptStripper(re.compile(r'^(In \[\d+\]: |\s*\.{3,}: ?)'))

90

93

91

def cell_magic(lines):
    """Turn a ``%%magic`` cell into a single ``run_cell_magic`` call.

    Parameters
    ----------
    lines : list of str
        The lines of the cell.

    Returns
    -------
    list of str
        A one-element list holding the ``get_ipython().run_cell_magic(...)``
        call, or *lines* unchanged when the cell is empty, does not start
        with ``%%``, or is a help request such as ``%%name?``.
    """
    if not lines or not lines[0].startswith('%%'):
        return lines
    if re.match(r'%%\w+\?', lines[0]):
        # This case will be handled by help_end
        return lines
    # First line is "%%name rest-of-line"; everything after it is the body.
    magic_name, _, first_line = lines[0][2:].rstrip().partition(' ')
    body = ''.join(lines[1:])
    return ['get_ipython().run_cell_magic(%r, %r, %r)\n'
            % (magic_name, first_line, body)]

101

104

102

105

103

def _find_assign_op(token_line) -> Optional[int]:
    """Get the index of the first assignment in the line ('=' not inside brackets)

    Note: We don't try to support multiple special assignment (a = b = %foo)

    Parameters
    ----------
    token_line : sequence of tokens
        Tokens of one line; only the ``string`` attribute of each is read.

    Returns
    -------
    int or None
        Index into *token_line* of the first ``=`` token found at bracket
        depth zero, or None if there is none.
    """
    paren_level = 0
    for i, ti in enumerate(token_line):
        s = ti.string
        if s == '=' and paren_level == 0:
            return i
        if s in {'(','[','{'}:
            paren_level += 1
        elif s in {')', ']', '}'}:
            # Never go negative on an unbalanced closing bracket.
            if paren_level > 0:
                paren_level -= 1
    return None

119

122

120

def find_end_of_continued_line(lines, start_line: int):
    """Find the last line of a line explicitly extended using backslashes.

    Uses 0-indexed line numbers.

    Parameters
    ----------
    lines : list of str
        Physical lines; a continued line ends with a backslash followed by
        a newline.
    start_line : int
        Index of the line at which to start looking.

    Returns
    -------
    int
        Index of the first line at or after *start_line* that does not end
        in a backslash-newline. If every line through the end of *lines* is
        continued, ``len(lines)`` is returned, which is one past the last
        valid index.
    """
    end_line = start_line
    while lines[end_line].endswith('\\\n'):
        end_line += 1
        if end_line >= len(lines):
            # Ran off the end: the final line itself ends with a backslash.
            break
    return end_line

131

134

132

def assemble_continued_line(lines, start: Tuple[int, int], end_line: int):
    r"""Assemble a single line from multiple continued line pieces

    Continued lines are lines ending in ``\``, and the line following the last
    ``\`` in the block.

    For example, this code continues over multiple lines::

        if (assign_ix is not None) \
             and (len(line) >= assign_ix + 2) \
             and (line[assign_ix+1].string == '%') \
             and (line[assign_ix+2].type == tokenize.NAME):

    This statement contains four continued line pieces.
    Assembling these pieces into a single line would give::

        if (assign_ix is not None) and (len(line) >= assign_ix + 2) and (line[...

    This uses 0-indexed line numbers. *start* is (lineno, colno).

    Used to allow ``%magic`` and ``!system`` commands to be continued over
    multiple lines.

    Parameters
    ----------
    lines : list of str
        Physical lines of the cell.
    start : tuple of (int, int)
        Line index and column at which the assembled text begins.
    end_line : int
        Index of the last physical line to include.

    Returns
    -------
    str
        The pieces joined with single spaces, without trailing whitespace,
        continuation backslashes or the final newline.
    """
    parts = [lines[start[0]][start[1]:]] + lines[start[0]+1:end_line+1]
    return ' '.join([p.rstrip()[:-1] for p in parts[:-1]]  # Strip backslash+newline
                    + [parts[-1].rstrip()])                # Strip newline from last line

158

161

159

class TokenTransformBase:
    """Base class for transformations which examine tokens.

    Special syntax should not be transformed when it occurs inside strings or
    comments. This is hard to reliably avoid with regexes. The solution is to
    tokenise the code as Python, and recognise the special syntax in the tokens.

    IPython's special syntax is not valid Python syntax, so tokenising may go
    wrong after the special syntax starts. These classes therefore find and
    transform *one* instance of special syntax at a time into regular Python
    syntax. After each transformation, tokens are regenerated to find the next
    piece of special syntax.

    Subclasses need to implement one class method (find)
    and one regular method (transform).

    The priority attribute can select which transformation to apply if multiple
    transformers match in the same place. Lower numbers have higher priority.
    This allows "%magic?" to be turned into a help call rather than a magic call.
    """
    # Lower numbers -> higher priority (for matches in the same location)
    priority = 10

    def sortby(self):
        """Return the sort key ``(start_line, start_col, priority)``."""
        return self.start_line, self.start_col, self.priority

    def __init__(self, start):
        """Record the match position from *start*, a 1-indexed (line, col) pair."""
        self.start_line = start[0] - 1   # Shift from 1-index to 0-index
        self.start_col = start[1]

    @classmethod
    def find(cls, tokens_by_line):
        """Find one instance of special syntax in the provided tokens.

        Tokens are grouped into logical lines for convenience,
        so it is easy to e.g. look at the first token of each line.
        *tokens_by_line* is a list of lists of tokenize.TokenInfo objects.

        This should return an instance of its class, pointing to the start
        position it has found, or None if it found no match.
        """
        raise NotImplementedError

    def transform(self, lines: List[str]):
        """Transform one instance of special syntax found by ``find()``

        Takes a list of strings representing physical lines,
        returns a similar list of transformed lines.
        """
        raise NotImplementedError

209

212

210

class MagicAssign(TokenTransformBase):
    """Transformer for assignments from magics (a = %foo)"""
    @classmethod
    def find(cls, tokens_by_line):
        """Find the first magic assignment (a = %foo) in the cell.

        Returns an instance pointing at the ``%`` token, or None if no line
        has a top-level ``=`` immediately followed by ``%`` and a name.
        """
        for line in tokens_by_line:
            assign_ix = _find_assign_op(line)
            # Two tokens after '=' are inspected, so the line must be
            # strictly longer than assign_ix + 2; '>=' would allow an
            # IndexError on line[assign_ix+2].
            if (assign_ix is not None) \
                    and (len(line) > assign_ix + 2) \
                    and (line[assign_ix+1].string == '%') \
                    and (line[assign_ix+2].type == tokenize.NAME):
                return cls(line[assign_ix+1].start)

    def transform(self, lines: List[str]):
        """Transform a magic assignment found by the ``find()`` classmethod.

        The text before ``%`` is kept as the left-hand side and the magic
        (including any backslash-continued lines) is replaced by a single
        ``get_ipython().run_line_magic(name, args)`` call.
        """
        start_line, start_col = self.start_line, self.start_col
        lhs = lines[start_line][:start_col]
        end_line = find_end_of_continued_line(lines, start_line)
        rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
        assert rhs.startswith('%'), rhs
        magic_name, _, args = rhs[1:].partition(' ')

        lines_before = lines[:start_line]
        call = "get_ipython().run_line_magic({!r}, {!r})".format(magic_name, args)
        new_line = lhs + call + '\n'
        lines_after = lines[end_line+1:]

        return lines_before + [new_line] + lines_after

240

243

241

244

242

class SystemAssign(TokenTransformBase):
    """Transformer for assignments from system commands (a = !foo)"""
    @classmethod
    def find(cls, tokens_by_line):
        """Find the first system assignment (a = !foo) in the cell.

        Returns an instance pointing at the ``!`` token, or None if no line
        has a top-level ``=`` followed (after optional whitespace error
        tokens) by ``!``. Lines whose stripped text begins with ``=`` are
        ignored.
        """
        for line in tokens_by_line:
            assign_ix = _find_assign_op(line)
            if (assign_ix is not None) \
                    and not line[assign_ix].line.strip().startswith('=') \
                    and (len(line) >= assign_ix + 2) \
                    and (line[assign_ix + 1].type == tokenize.ERRORTOKEN):
                ix = assign_ix + 1

                # Walk the error tokens after '=': skip whitespace ones and
                # stop at the first that is neither whitespace nor '!'.
                while ix < len(line) and line[ix].type == tokenize.ERRORTOKEN:
                    if line[ix].string == '!':
                        return cls(line[ix].start)
                    elif not line[ix].string.isspace():
                        break
                    ix += 1

    def transform(self, lines: List[str]):
        """Transform a system assignment found by the ``find()`` classmethod.

        The text before ``!`` is kept as the left-hand side and the command
        (including any backslash-continued lines) is replaced by a single
        ``get_ipython().getoutput(cmd)`` call.
        """
        start_line, start_col = self.start_line, self.start_col

        lhs = lines[start_line][:start_col]
        end_line = find_end_of_continued_line(lines, start_line)
        rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
        assert rhs.startswith('!'), rhs
        cmd = rhs[1:]

        lines_before = lines[:start_line]
        call = "get_ipython().getoutput({!r})".format(cmd)
        new_line = lhs + call + '\n'
        lines_after = lines[end_line + 1:]

        return lines_before + [new_line] + lines_after

280

283

281

# The escape sequences that define the syntax transformations IPython will
# apply to user input.  These can NOT be just changed here: many regular
# expressions and other parts of the code may use their hardcoded values, and
# for all intents and purposes they constitute the 'IPython syntax', so they
# should be considered fixed.

ESC_SHELL  = '!'     # Send line to underlying system shell
ESC_SH_CAP = '!!'    # Send line to system shell and capture output
ESC_HELP   = '?'     # Find information about object
ESC_HELP2  = '??'    # Find extra-detailed information about object
ESC_MAGIC  = '%'     # Call magic function
ESC_MAGIC2 = '%%'    # Call cell-magic function
ESC_QUOTE  = ','     # Split args on whitespace, quote each as string and call
ESC_QUOTE2 = ';'     # Quote all args as a single string, call
ESC_PAREN  = '/'     # Call first argument with rest of line as arguments

ESCAPE_SINGLES = {'!', '?', '%', ',', ';', '/'}
ESCAPE_DOUBLES = {'!!', '??'}  # %% (cell magic) is handled separately

299

302

300

def _make_help_call(target, esc, next_input=None):
    """Prepares a pinfo(2)/psearch call from a target name and the escape
    (i.e. ? or ??)

    Parameters
    ----------
    target : str
        The name to inspect; a ``*`` in it selects a wildcard search.
    esc : str
        The help escape. ``'??'`` selects ``pinfo2``; anything else selects
        ``psearch`` for wildcard targets and ``pinfo`` otherwise.
    next_input : str, optional
        If given, a ``set_next_input`` call with this text is emitted before
        the magic call.

    Returns
    -------
    str
        Source text of the ``get_ipython()`` call(s).
    """
    method = 'pinfo2' if esc == '??' \
                else 'psearch' if '*' in target \
                else 'pinfo'
    # The magic name is always one of the three literals above, so it is
    # passed straight through as the name and the target as the argument.
    if next_input is None:
        return 'get_ipython().run_line_magic(%r, %r)' % (method, target)
    else:
        return 'get_ipython().set_next_input(%r);get_ipython().run_line_magic(%r, %r)' % \
            (next_input, method, target)

315

318

316

def _tr_help(content):
    """Translate lines escaped with: ?

    A naked help line should fire the intro help screen (shell.show_usage())

    Returns the source text of the replacement call: ``show_usage()`` for
    empty *content*, otherwise the help call built for the ``?`` escape.
    """
    if not content:
        return 'get_ipython().show_usage()'

    return _make_help_call(content, '?')

325

328

326

def _tr_help2(content):
    """Translate lines escaped with: ??

    A naked help line should fire the intro help screen (shell.show_usage())

    Returns the source text of the replacement call: ``show_usage()`` for
    empty *content*, otherwise the help call built for the ``??`` escape.
    """
    if not content:
        return 'get_ipython().show_usage()'

    return _make_help_call(content, '??')

335

338

336

def _tr_magic(content):
    """Translate lines escaped with a percent sign: %

    *content* is the line without its leading ``%``. The text up to the
    first space is the magic name and the remainder is passed as its
    argument string.
    """
    name, _, args = content.partition(' ')
    return 'get_ipython().run_line_magic(%r, %r)' % (name, args)

340

343

341

def _tr_quote(content):
    """Translate lines escaped with a comma: ,

    *content* is the line without its leading ``,``. The text up to the
    first space is the callable's name; the rest is split on whitespace and
    each piece is passed as a double-quoted string argument.
    """
    name, _, args = content.partition(' ')
    return '%s("%s")' % (name, '", "'.join(args.split()) )

345

348

346

def _tr_quote2(content):
    """Translate lines escaped with a semicolon: ;

    *content* is the line without its leading ``;``. The text up to the
    first space is the callable's name; everything after it is passed as
    one double-quoted string argument.
    """
    name, _, args = content.partition(' ')
    return '%s("%s")' % (name, args)

350

353

351

def _tr_paren(content):
    """Translate lines escaped with a slash: /

    *content* is the line without its leading ``/``. The text up to the
    first space is the callable's name; the rest is split on whitespace and
    the pieces are passed, unquoted, as comma-separated arguments.
    """
    name, _, args = content.partition(' ')
    return '%s(%s)' % (name, ", ".join(args.split()))

355

358

356

# Maps each escape sequence to a callable that takes the rest of the line
# and returns the source text of the replacement call.
tr = { ESC_SHELL  : 'get_ipython().system({!r})'.format,
       ESC_SH_CAP : 'get_ipython().getoutput({!r})'.format,
       ESC_HELP   : _tr_help,
       ESC_HELP2  : _tr_help2,
       ESC_MAGIC  : _tr_magic,
       ESC_QUOTE  : _tr_quote,
       ESC_QUOTE2 : _tr_quote2,
       ESC_PAREN  : _tr_paren }

364

367

365

class EscapedCommand(TokenTransformBase):
    """Transformer for escaped commands like %foo, !foo, or /foo"""
    @classmethod
    def find(cls, tokens_by_line):
        """Find the first escaped command (%foo, !foo, etc.) in the cell.

        Returns an instance pointing at the escape token, or None if no line
        has one of ``ESCAPE_SINGLES`` as its first token after any
        INDENT/DEDENT tokens.
        """
        for line in tokens_by_line:
            if not line:
                continue
            ix = 0
            ll = len(line)
            # Skip over the indentation bookkeeping tokens.
            while ll > ix and line[ix].type in {tokenize.INDENT, tokenize.DEDENT}:
                ix += 1
            if ix >= ll:
                continue
            if line[ix].string in ESCAPE_SINGLES:
                return cls(line[ix].start)

    def transform(self, lines):
        """Transform an escaped line found by the ``find()`` classmethod.

        The escaped command (including any backslash-continued lines) is
        replaced by one line holding the original indentation followed by the
        call produced by the matching entry of ``tr``; the call is empty if
        the escape has no entry.
        """
        start_line, start_col = self.start_line, self.start_col

        indent = lines[start_line][:start_col]
        end_line = find_end_of_continued_line(lines, start_line)
        line = assemble_continued_line(lines, (start_line, start_col), end_line)

        # Prefer a two-character escape (!! or ??) over a single one.
        if len(line) > 1 and line[:2] in ESCAPE_DOUBLES:
            escape, content = line[:2], line[2:]
        else:
            escape, content = line[:1], line[1:]

        if escape in tr:
            call = tr[escape](content)
        else:
            call = ''

        lines_before = lines[:start_line]
        new_line = indent + call + '\n'
        lines_after = lines[end_line + 1:]

        return lines_before + [new_line] + lines_after

407

410

408

# Matches a trailing help request. Group 1 is the target (optionally
# prefixed by up to two '%', with dotted parts and '*' wildcards allowed),
# group 3 is the escape itself.
_help_end_re = re.compile(r"""(%{0,2}
                              (?!\d)[\w*]+            # Variable name
                              (\.(?!\d)[\w*]+)*       # .etc.etc
                              )
                              (\?\??)$                # ? or ??
                              """,
                              re.VERBOSE)

415

418

416

class HelpEnd(TokenTransformBase):
    """Transformer for help syntax: obj? and obj??"""
    # This needs to be higher priority (lower number) than EscapedCommand so
    # that inspecting magics (%foo?) works.
    priority = 5

    def __init__(self, start, q_locn):
        """Record the statement start and the ``?`` position.

        Both *start* and *q_locn* are 1-indexed (line, col) pairs.
        """
        super().__init__(start)
        self.q_line = q_locn[0] - 1  # Shift from 1-indexed to 0-indexed
        self.q_col = q_locn[1]

    @classmethod
    def find(cls, tokens_by_line):
        """Find the first help command (foo?) in the cell.

        Returns an instance pointing at the first token of the line that is
        not INDENT/DEDENT and at the trailing ``?``, or None if no line ends
        in ``?``.
        """
        for line in tokens_by_line:
            # Last token is NEWLINE; look at last but one
            if len(line) > 2 and line[-2].string == '?':
                # Find the first token that's not INDENT/DEDENT
                ix = 0
                while line[ix].type in {tokenize.INDENT, tokenize.DEDENT}:
                    ix += 1
                return cls(line[ix].start, line[-2].start)

    def transform(self, lines):
        """Transform a help command found by the ``find()`` classmethod.

        Raises
        ------
        SyntaxError
            If the text ending in ``?`` does not match ``_help_end_re``.
        """
        piece = ''.join(lines[self.start_line:self.q_line+1])
        indent, content = piece[:self.start_col], piece[self.start_col:]
        lines_before = lines[:self.start_line]
        lines_after = lines[self.q_line + 1:]

        m = _help_end_re.search(content)
        if not m:
            raise SyntaxError(content)
        target = m.group(1)
        esc = m.group(3)

        # If we're mid-command, put it back on the next prompt for the user.
        next_input = None
        if (not lines_before) and (not lines_after) \
                and content.strip() != m.group(0):
            next_input = content.rstrip('?\n')

        call = _make_help_call(target, esc, next_input=next_input)
        new_line = indent + call + '\n'

        return lines_before + [new_line] + lines_after

465

468

466

def make_tokens_by_line(lines:List[str]):
    """Tokenize a series of lines and group tokens by line.

    The tokens for a multiline Python string or expression are grouped as one
    line. All lines except the last lines should keep their line ending ('\\n',
    '\\r\\n') for this to properly work. Use `.splitlines(keepends=True)`
    for example when passing block of text to this function.

    Parameters
    ----------
    lines : list of str
        Source lines, each (except possibly the last) with its line ending.

    Returns
    -------
    list of list
        One list of tokens per logical line. If tokenization stops with a
        ``tokenize.TokenError`` (input ended inside a multiline string or
        expression), the tokens produced up to that point are returned.
    """
    # NL tokens are used inside multiline expressions, but also after blank
    # lines or comments. This is intentional - see https://bugs.python.org/issue17061
    # We want to group the former case together but split the latter, so we
    # track parentheses level, similar to the internals of tokenize.

    # reexported from token on 3.7+
    NEWLINE, NL = tokenize.NEWLINE, tokenize.NL  # type: ignore
    tokens_by_line:List[List[Any]] = [[]]
    # '\r\n' needs no separate entry: such a line already ends with '\n'.
    if len(lines) > 1 and not lines[0].endswith(('\n', '\r', '\x0b', '\x0c')):
        # stacklevel=2 attributes the warning to the caller that passed the
        # malformed list rather than to this helper.
        warnings.warn("`make_tokens_by_line` received a list of lines which do not have lineending markers ('\\n', '\\r', '\\r\\n', '\\x0b', '\\x0c'), behavior will be unspecified", stacklevel=2)
    parenlev = 0
    try:
        for token in tokenize.generate_tokens(iter(lines).__next__):
            tokens_by_line[-1].append(token)
            if (token.type == NEWLINE) \
                    or ((token.type == NL) and (parenlev <= 0)):
                # End of a logical line, or an NL outside any brackets
                # (blank line / comment): start a new group.
                tokens_by_line.append([])
            elif token.string in {'(', '[', '{'}:
                parenlev += 1
            elif token.string in {')', ']', '}'}:
                # Never go negative on unbalanced closing brackets.
                if parenlev > 0:
                    parenlev -= 1
    except tokenize.TokenError:
        # Input ended in a multiline string or expression. That's OK for us.
        pass

    # Drop the empty group opened after the final NEWLINE/NL, if any.
    if not tokens_by_line[-1]:
        tokens_by_line.pop()

    return tokens_by_line

507

510

508

def show_linewise_tokens(s: str):
    """Print the tokens of *s* grouped by line (investigation/debugging aid).

    A trailing newline is appended when *s* lacks one before the text is split
    and handed to ``make_tokens_by_line``.
    """
    text = s if s.endswith('\n') else s + '\n'
    for token_group in make_tokens_by_line(text.splitlines(keepends=True)):
        print("Line -------")
        for tok in token_group:
            print(" ", tok)

517

520

518

# Arbitrary cap on repeated transform passes, so that input which keeps
# changing cannot leave us stuck in an infinite loop.
TRANSFORM_LOOP_LIMIT = 500

520

523

521

class TransformerManager:
    """Applies various transformations to a cell or code block.

    The key methods for external use are ``transform_cell()``
    and ``check_complete()``.
    """
    def __init__(self):
        # Line-list -> line-list callables, applied first and in order.
        self.cleanup_transforms = [
            leading_empty_lines,
            leading_indent,
            classic_prompt,
            ipython_prompt,
        ]
        # Line-list -> line-list callables, applied after the cleanup pass.
        self.line_transforms = [
            cell_magic,
        ]
        # Classes offering ``find(tokens_by_line)`` and ``transform(lines)``.
        self.token_transformers = [
            MagicAssign,
            SystemAssign,
            EscapedCommand,
            HelpEnd,
        ]

    def do_one_token_transform(self, lines):
        """Find and run the transform earliest in the code.

        Returns (changed, lines).

        This method is called repeatedly until changed is False, indicating
        that all available transformations are complete.

        The tokens following IPython special syntax might not be valid, so
        the transformed code is retokenised every time to identify the next
        piece of special syntax. Hopefully long code cells are mostly valid
        Python, not using lots of IPython special syntax, so this shouldn't be
        a performance issue.
        """
        tokens_by_line = make_tokens_by_line(lines)
        candidates = []
        for transformer_cls in self.token_transformers:
            transformer = transformer_cls.find(tokens_by_line)
            if transformer:
                candidates.append(transformer)

        if not candidates:
            # Nothing to transform
            return False, lines
        ordered_transformers = sorted(candidates, key=TokenTransformBase.sortby)
        for transformer in ordered_transformers:
            try:
                return True, transformer.transform(lines)
            except SyntaxError:
                # This candidate could not be applied; try the next one.
                pass
        return False, lines

    def do_token_transforms(self, lines):
        """Apply token transforms repeatedly until the lines stop changing.

        Raises
        ------
        RuntimeError
            If the lines are still changing after ``TRANSFORM_LOOP_LIMIT``
            passes.
        """
        for _ in range(TRANSFORM_LOOP_LIMIT):
            changed, lines = self.do_one_token_transform(lines)
            if not changed:
                return lines

        raise RuntimeError("Input transformation still changing after "
                           "%d iterations. Aborting." % TRANSFORM_LOOP_LIMIT)

    def transform_cell(self, cell: str) -> str:
        """Transforms a cell of input code"""
        if not cell.endswith('\n'):
            cell += '\n'  # Ensure the cell has a trailing newline
        lines = cell.splitlines(keepends=True)
        for transform in self.cleanup_transforms + self.line_transforms:
            lines = transform(lines)

        lines = self.do_token_transforms(lines)
        return ''.join(lines)

    def check_complete(self, cell: str):
        """Return whether a block of code is ready to execute, or should be continued

        Parameters
        ----------
        cell : string
          Python input code, which can be multiline.

        Returns
        -------
        status : str
          One of 'complete', 'incomplete', or 'invalid' if source is not a
          prefix of valid code.
        indent_spaces : int or None
          The number of spaces by which to indent the next line of code. If
          status is not 'incomplete', this is None.
        """
        # Remember if the lines ends in a new line: true when the run of
        # trailing whitespace contains a '\n'.
        ends_with_newline = '\n' in cell[len(cell.rstrip()):]

        if not ends_with_newline:
            # Append an newline for consistent tokenization
            # See https://bugs.python.org/issue33899
            cell += '\n'

        lines = cell.splitlines(keepends=True)

        if not lines:
            return 'complete', None

        if lines[-1].endswith('\\'):
            # Explicit backslash continuation
            return 'incomplete', find_last_indent(lines)

        try:
            for transform in self.cleanup_transforms:
                if not getattr(transform, 'has_side_effects', False):
                    lines = transform(lines)
        except SyntaxError:
            return 'invalid', None

        if lines[0].startswith('%%'):
            # Special case for cell magics - completion marked by blank line
            if lines[-1].strip():
                return 'incomplete', find_last_indent(lines)
            else:
                return 'complete', None

        try:
            for transform in self.line_transforms:
                if not getattr(transform, 'has_side_effects', False):
                    lines = transform(lines)
            lines = self.do_token_transforms(lines)
        except SyntaxError:
            return 'invalid', None

        tokens_by_line = make_tokens_by_line(lines)

        if not tokens_by_line:
            return 'incomplete', find_last_indent(lines)

        if tokens_by_line[-1][-1].type != tokenize.ENDMARKER:
            # We're in a multiline string or expression
            return 'incomplete', find_last_indent(lines)

        newline_types = {tokenize.NEWLINE, tokenize.COMMENT, tokenize.ENDMARKER}  # type: ignore

        # Pop the last line which only contains DEDENTs and ENDMARKER
        last_token_line = None
        if {t.type for t in tokens_by_line[-1]} in [
            {tokenize.DEDENT, tokenize.ENDMARKER},
            {tokenize.ENDMARKER}
        ] and len(tokens_by_line) > 1:
            last_token_line = tokens_by_line.pop()

        # Strip trailing NEWLINE/COMMENT/ENDMARKER tokens so the last
        # remaining token is the last significant one on that line.
        while tokens_by_line[-1] and tokens_by_line[-1][-1].type in newline_types:
            tokens_by_line[-1].pop()

        if not tokens_by_line[-1]:
            return 'incomplete', find_last_indent(lines)

        if tokens_by_line[-1][-1].string == ':':
            # The last line starts a block (e.g. 'if foo:')
            ix = 0
            while tokens_by_line[-1][ix].type in {tokenize.INDENT, tokenize.DEDENT}:
                ix += 1

            indent = tokens_by_line[-1][ix].start[1]
            return 'incomplete', indent + 4

        if tokens_by_line[-1][0].line.endswith('\\'):
            return 'incomplete', None

        # At this point, our checks think the code is complete (or invalid).
        # We'll use codeop.compile_command to check this with the real parser
        try:
            with warnings.catch_warnings():
                # Turn SyntaxWarning into an exception so it is reported
                # as 'invalid' below.
                warnings.simplefilter('error', SyntaxWarning)
                res = compile_command(''.join(lines), symbol='exec')
        except (SyntaxError, OverflowError, ValueError, TypeError,
                MemoryError, SyntaxWarning):
            return 'invalid', None
        else:
            if res is None:
                return 'incomplete', find_last_indent(lines)

        if last_token_line and last_token_line[0].type == tokenize.DEDENT:
            if ends_with_newline:
                return 'complete', None
            return 'incomplete', find_last_indent(lines)

        # Everything else is complete, whether or not the input ends with a
        # blank line (the former blank-line special case returned the same
        # value as this fall-through).
        return 'complete', None

720

723

721

724

722

def find_last_indent(lines):
    """Return the indentation width of the last line in *lines*.

    Only leading spaces and tabs count as indentation; each tab is counted
    as four spaces.

    Parameters
    ----------
    lines : list of str
        Source lines; only the final element is inspected.

    Returns
    -------
    int
        Width of the last line's leading whitespace, or 0 when the line is
        not indented or *lines* is empty.
    """
    if not lines:
        # Nothing to measure; avoid an IndexError on lines[-1].
        return 0
    last = lines[-1]
    # Leading run of spaces/tabs (the same text a ``^[ \t]+`` match yields).
    prefix = last[:len(last) - len(last.lstrip(' \t'))]
    return len(prefix.replace('\t', ' '*4))

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             """Input transformer machinery to support IPython special syntax.
             This includes the machinery to recognise and transform ``%magic`` commands,
             ``!system`` commands, ``help?`` querying, prompt stripping, and so forth.
             Added: IPython 7.0. Replaces inputsplitter and inputtransformer which were
             deprecated in 7.0.
             """
             # Copyright (c) IPython Development Team.
             # Distributed under the terms of the Modified BSD License.
             from codeop import compile_command
             import re
             import tokenize
             from typing import List, Tuple, Optional, Any
             import warnings
             _indent_re = re.compile(r'^[ \t]+')
             def leading_empty_lines(lines):
                 """Drop blank lines from the start of a cell.

                 Parameters
                 ----------
                 lines : list of str
                     Physical lines of the cell.

                 Returns
                 -------
                 list of str
                     A new list starting at the first line that contains something
                     other than whitespace. If *lines* is empty, or every line is
                     blank, *lines* itself is returned unchanged.
                 """
                 if not lines:
                     return lines
                 first_content = next(
                     (ix for ix, text in enumerate(lines) if text and not text.isspace()),
                     None,
                 )
                 if first_content is None:
                     # Nothing but blank lines: keep the input as it is.
                     return lines
                 return lines[first_content:]
             def leading_indent(lines):
                 """Strip the first line's indentation from every line of the cell.

                 If the first line starts with spaces or tabs, that exact run of
                 whitespace is removed from each line that begins with it. Lines that
                 do not begin with it are left untouched.

                 Parameters
                 ----------
                 lines : list of str
                     Physical lines of the cell.

                 Returns
                 -------
                 list of str
                     The dedented lines, or *lines* itself when it is empty or its
                     first line is not indented.
                 """
                 if not lines:
                     return lines
                 found = _indent_re.match(lines[0])
                 if found is None:
                     return lines
                 prefix = found.group(0)
                 width = len(prefix)
                 dedented = []
                 for text in lines:
                     dedented.append(text[width:] if text.startswith(prefix) else text)
                 return dedented
             class PromptStripper:
                 """Callable that removes input prompts from a block of lines.

                 Parameters
                 ----------
                 prompt_re : regular expression
                     A compiled pattern matching any input prompt, including
                     continuation prompts (e.g. ``...``).
                 initial_re : regular expression, optional
                     A compiled pattern matching only the initial prompt, not the
                     continuation prompt. When omitted, prompt_re is used for the first
                     line too. Mainly useful for plain Python prompts (``>>>``), where
                     ``...`` on its own is a valid Python 3 expression and so should
                     not be treated as a prompt on the first line.

                 Notes
                 -----
                 The first line is tested against initial_re and the second line
                 against prompt_re. If either matches, one prompt is stripped from
                 the start of every line in the block; otherwise the block is
                 returned unchanged.
                 """
                 def __init__(self, prompt_re, initial_re=None):
                     self.prompt_re = prompt_re
                     self.initial_re = prompt_re if not initial_re else initial_re

                 def _strip(self, lines):
                     # count=1: remove at most one prompt per line.
                     strip_one = self.prompt_re.sub
                     return [strip_one('', text, count=1) for text in lines]

                 def __call__(self, lines):
                     if not lines:
                         return lines
                     if self.initial_re.match(lines[0]):
                         return self._strip(lines)
                     if len(lines) > 1 and self.prompt_re.match(lines[1]):
                         return self._strip(lines)
                     return lines
             # Stripper for plain Python prompts: ``>>>`` or ``...`` at the start of a
             # line, followed by a space or the end of the line. Only ``>>>`` counts as
             # a prompt on the first line.
             classic_prompt = PromptStripper(
                 prompt_re=re.compile(r'^(>>>|\.\.\.)( |$)'),
                 initial_re=re.compile(r'^>>>( |$)')
             )
             # Stripper for IPython prompts: ``In [N]: `` or a continuation prompt made
             # of optional whitespace, three or more dots, a colon and an optional space.
             ipython_prompt = PromptStripper(re.compile(r'^(In \[\d+\]: |\s*\.{3,}: ?)'))
             def cell_magic(lines):
                 """Rewrite a ``%%magic`` cell as a single ``run_cell_magic`` call.

                 Parameters
                 ----------
                 lines : list of str
                     Physical lines of the cell.

                 Returns
                 -------
                 list of str
                     A one-element list holding the generated call when the first line
                     starts with ``%%``. *lines* is returned unchanged when it is
                     empty, when the first line is not a cell magic, or when the first
                     line has the ``%%name?`` help form.
                 """
                 if not lines:
                     return lines
                 header = lines[0]
                 if not header.startswith('%%'):
                     return lines
                 if re.match(r'%%\w+\?', header):
                     # This case will be handled by help_end
                     return lines
                 # Everything after '%%' up to the first space is the magic name;
                 # the rest of the first line is passed along as its argument string.
                 magic_name, _, first_line = header[2:].rstrip().partition(' ')
                 body = ''.join(lines[1:])
                 template = 'get_ipython().run_cell_magic(%r, %r, %r)\n'
                 return [template % (magic_name, first_line, body)]
             def _find_assign_op(token_line) -> Optional[int]:
                 """Get the index of the first assignment in the line ('=' not inside brackets)
                 Note: We don't try to support multiple special assignment (a = b = %foo)
                 """
                 paren_level = 0
                 for i, ti in enumerate(token_line):
                     s = ti.string
                     if s == '=' and paren_level == 0:
                         return i
                     if s in {'(','[','{'}:
                         paren_level += 1
                     elif s in {')', ']', '}'}:
                         if paren_level > 0:
                             paren_level -= 1
                 return None
             def find_end_of_continued_line(lines, start_line: int):
                 """Find the last line of a line explicitly extended using backslashes.

                 Uses 0-indexed line numbers.

                 Parameters
                 ----------
                 lines : list of str
                     Physical lines, each keeping its line ending.
                 start_line : int
                     Index of the line where the (possibly continued) line starts.

                 Returns
                 -------
                 int
                     Index of the first line at or after *start_line* that does not
                     end with a backslash followed by a newline. If every line
                     through the end of *lines* is continued, the index of the final
                     line is returned, so the result is always a valid index.
                 """
                 end_line = start_line
                 # Stop on the final line even if it ends with a backslash: there is no
                 # following line to continue onto.
                 while lines[end_line].endswith('\\\n') and end_line + 1 < len(lines):
                     end_line += 1
                 return end_line
             def assemble_continued_line(lines, start: Tuple[int, int], end_line: int):
                 r"""Join the physical pieces of a backslash-continued line into one line.

                 A continued line is made of every physical line ending in ``\`` plus
                 the line that follows the last ``\``. For instance, a statement
                 written over four physical lines, the first three ending in ``\``,
                 has four pieces and is assembled into one line of text.

                 Used to allow ``%magic`` and ``!system`` commands to be continued over
                 multiple lines.

                 Parameters
                 ----------
                 lines : list of str
                     Physical lines, each keeping its line ending.
                 start : (int, int)
                     0-indexed (lineno, colno) at which the assembled text begins.
                 end_line : int
                     0-indexed number of the last physical line to include.

                 Returns
                 -------
                 str
                     The pieces joined with single spaces. Every piece but the last
                     has its trailing whitespace and then its final character (the
                     backslash) removed; the last piece only loses trailing whitespace.
                 """
                 first_row, first_col = start[0], start[1]
                 pieces = [lines[first_row][first_col:]]
                 pieces.extend(lines[first_row + 1:end_line + 1])
                 *continued, final = pieces
                 cleaned = [piece.rstrip()[:-1] for piece in continued]  # drop backslash+newline
                 cleaned.append(final.rstrip())                          # drop newline only
                 return ' '.join(cleaned)
             class TokenTransformBase:
                 """Base class for transformations driven by Python tokens.

                 Special syntax must be left alone inside strings and comments, which
                 is hard to guarantee with regexes. Instead the code is tokenised as
                 Python and the special syntax is recognised in the token stream.

                 Because IPython's special syntax is not valid Python, tokenising may
                 go wrong after the point where it starts. Each transformer therefore
                 locates and rewrites *one* occurrence at a time; the tokens are then
                 regenerated to look for the next occurrence.

                 Subclasses implement one class method (find) and one regular method
                 (transform).

                 The priority attribute decides between transformers matching at the
                 same position: lower numbers win. This lets "%magic?" become a help
                 call rather than a magic call.
                 """
                 # Lower numbers -> higher priority (for matches in the same location)
                 priority = 10

                 def sortby(self):
                     """Sort key: earliest position first, then by priority."""
                     return (self.start_line, self.start_col, self.priority)

                 def __init__(self, start):
                     # *start* is a tokenize-style (line, column) pair with a 1-indexed
                     # line; store the line 0-indexed to match list indices.
                     lineno, self.start_col = start[0], start[1]
                     self.start_line = lineno - 1

                 @classmethod
                 def find(cls, tokens_by_line):
                     """Find one instance of special syntax in the provided tokens.

                     *tokens_by_line* is a list of lists of tokenize.TokenInfo objects,
                     grouped into logical lines so that e.g. the first token of each
                     line is easy to inspect.

                     Implementations return an instance of the class pointing at the
                     start of the match, or None when nothing matches.
                     """
                     raise NotImplementedError

                 def transform(self, lines: List[str]):
                     """Transform one instance of special syntax found by ``find()``.

                     Takes a list of strings representing physical lines and returns a
                     similar list of transformed lines.
                     """
                     raise NotImplementedError
             class MagicAssign(TokenTransformBase):
                 """Transformer for assignments from magics (a = %foo)"""
                 @classmethod
                 def find(cls, tokens_by_line):
                     """Find the first magic assignment (a = %foo) in the cell.

                     Returns an instance pointing at the ``%`` token, or None when no
                     line has a top-level ``=`` directly followed by ``%`` and a name.
                     """
                     for line in tokens_by_line:
                         assign_ix = _find_assign_op(line)
                         # Both line[assign_ix+1] and line[assign_ix+2] are read, so the
                         # line needs at least assign_ix + 3 tokens. A line may end right
                         # after the '%' (no NEWLINE token) when tokenizing stopped early.
                         if (assign_ix is not None) \
                                 and (len(line) > assign_ix + 2) \
                                 and (line[assign_ix+1].string == '%') \
                                 and (line[assign_ix+2].type == tokenize.NAME):
                             return cls(line[assign_ix+1].start)
                     return None

                 def transform(self, lines: List[str]):
                     """Transform a magic assignment found by the ``find()`` classmethod.

                     The text from the ``%`` to the end of the (possibly
                     backslash-continued) line is replaced by a
                     ``get_ipython().run_line_magic(name, args)`` call; the text before
                     the ``%`` is kept as the left-hand side. Returns the new list of
                     lines.
                     """
                     start_line, start_col = self.start_line, self.start_col
                     lhs = lines[start_line][:start_col]
                     end_line = find_end_of_continued_line(lines, start_line)
                     rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
                     assert rhs.startswith('%'), rhs
                     # The magic name runs up to the first space; the rest is its args.
                     magic_name, _, args = rhs[1:].partition(' ')

                     lines_before = lines[:start_line]
                     call = "get_ipython().run_line_magic({!r}, {!r})".format(magic_name, args)
                     new_line = lhs + call + '\n'
                     lines_after = lines[end_line+1:]

                     return lines_before + [new_line] + lines_after
             class SystemAssign(TokenTransformBase):
                 """Transformer for assignments from system commands (a = !foo)"""
                 @classmethod
                 def find(cls, tokens_by_line):
                     """Find the first system assignment (a = !foo) in the cell.

                     Returns an instance pointing at the ``!`` token, or None when no
                     line qualifies.
                     """
                     for line in tokens_by_line:
                         assign_ix = _find_assign_op(line)
                         if assign_ix is None:
                             continue
                         if line[assign_ix].line.strip().startswith('='):
                             # A line that begins with '=' has no left-hand side.
                             continue
                         if len(line) < assign_ix + 2:
                             continue
                         if line[assign_ix + 1].type != tokenize.ERRORTOKEN:
                             continue
                         # Walk the run of error tokens after '=': whitespace may
                         # precede the '!', anything else rules this line out.
                         for tok in line[assign_ix + 1:]:
                             if tok.type != tokenize.ERRORTOKEN:
                                 break
                             if tok.string == '!':
                                 return cls(tok.start)
                             if not tok.string.isspace():
                                 break
                     return None

                 def transform(self, lines: List[str]):
                     """Transform a system assignment found by the ``find()`` classmethod.

                     The text from the ``!`` to the end of the (possibly
                     backslash-continued) line becomes a
                     ``get_ipython().getoutput(cmd)`` call; the text before the ``!``
                     is kept as the left-hand side. Returns the new list of lines.
                     """
                     row, col = self.start_line, self.start_col
                     end_line = find_end_of_continued_line(lines, row)
                     rhs = assemble_continued_line(lines, (row, col), end_line)
                     assert rhs.startswith('!'), rhs
                     call = "get_ipython().getoutput({!r})".format(rhs[1:])
                     replacement = lines[row][:col] + call + '\n'
                     return lines[:row] + [replacement] + lines[end_line + 1:]
             # Escape prefixes that make up IPython's special input syntax. Treat these
             # values as fixed: regular expressions and other code may rely on the
             # literal characters, so they cannot simply be changed here.
             ESC_SHELL = '!'      # Send line to underlying system shell
             ESC_SH_CAP = '!!'    # Send line to system shell and capture output
             ESC_HELP = '?'       # Find information about object
             ESC_HELP2 = '??'     # Find extra-detailed information about object
             ESC_MAGIC = '%'      # Call magic function
             ESC_MAGIC2 = '%%'    # Call cell-magic function
             ESC_QUOTE = ','      # Split args on whitespace, quote each as string and call
             ESC_QUOTE2 = ';'     # Quote all args as a single string, call
             ESC_PAREN = '/'      # Call first argument with rest of line as arguments

             # Every one-character escape.
             ESCAPE_SINGLES = {
                 ESC_SHELL, ESC_HELP, ESC_MAGIC, ESC_QUOTE, ESC_QUOTE2, ESC_PAREN,
             }
             # Two-character escapes; %% (cell magic) is handled separately.
             ESCAPE_DOUBLES = {ESC_SH_CAP, ESC_HELP2}
             def _make_help_call(target, esc, next_input=None):
                 """Prepares a pinfo(2)/psearch call from a target name and the escape
                 (i.e. ? or ??)"""
                 method  = 'pinfo2' if esc == '??' \
                             else 'psearch' if '*' in target \
                             else 'pinfo'
                 arg = " ".join([method, target])
                 #Prepare arguments for get_ipython().run_line_magic(magic_name, magic_args)
                 t_magic_name, _, t_magic_arg_s = arg.partition(' ')
                 t_magic_name = t_magic_name.lstrip(ESC_MAGIC)
                 if next_input is None:
                     return 'get_ipython().run_line_magic(%r, %r)' % (t_magic_name, t_magic_arg_s)
                 else:
                     return 'get_ipython().set_next_input(%r);get_ipython().run_line_magic(%r, %r)' % \
                        (next_input, t_magic_name, t_magic_arg_s)
             def _tr_help(content):
                 """Translate lines escaped with: ?

                 A bare ``?`` with nothing after it produces a call to
                 ``get_ipython().show_usage()``; otherwise a help call for *content*
                 is built.
                 """
                 if content:
                     return _make_help_call(content, '?')
                 return 'get_ipython().show_usage()'
             def _tr_help2(content):
                 """Translate lines escaped with: ??

                 A bare ``??`` with nothing after it produces a call to
                 ``get_ipython().show_usage()``; otherwise a detailed help call for
                 *content* is built.
                 """
                 if content:
                     return _make_help_call(content, '??')
                 return 'get_ipython().show_usage()'
             def _tr_magic(content):
                 "Translate lines escaped with a percent sign: %"
                 name, _, args = content.partition(' ')
                 return 'get_ipython().run_line_magic(%r, %r)' % (name, args)
             def _tr_quote(content):
                 "Translate lines escaped with a comma: ,"
                 name, _, args = content.partition(' ')
                 return '%s("%s")' % (name, '", "'.join(args.split()) )
             def _tr_quote2(content):
                 "Translate lines escaped with a semicolon: ;"
                 name, _, args = content.partition(' ')
                 return '%s("%s")' % (name, args)
             def _tr_paren(content):
                 "Translate lines escaped with a slash: /"
                 name, _, args = content.partition(' ')
                 return '%s(%s)' % (name, ", ".join(args.split()))
             # Dispatch table: maps an escape prefix to a callable that receives the
             # text following the prefix and returns the replacement Python source.
             tr = { ESC_SHELL  : 'get_ipython().system({!r})'.format,
                    ESC_SH_CAP : 'get_ipython().getoutput({!r})'.format,
                    ESC_HELP   : _tr_help,
                    ESC_HELP2  : _tr_help2,
                    ESC_MAGIC  : _tr_magic,
                    ESC_QUOTE  : _tr_quote,
                    ESC_QUOTE2 : _tr_quote2,
                    ESC_PAREN  : _tr_paren }
             class EscapedCommand(TokenTransformBase):
                 """Transformer for escaped commands like %foo, !foo, or /foo"""
                 @classmethod
                 def find(cls, tokens_by_line):
                     """Find the first escaped command (%foo, !foo, etc.) in the cell.

                     A line qualifies when its first token other than INDENT/DEDENT is
                     one of the single-character escapes. Returns an instance pointing
                     at that token, or None.
                     """
                     layout_types = (tokenize.INDENT, tokenize.DEDENT)
                     for line in tokens_by_line:
                         first = next(
                             (tok for tok in line if tok.type not in layout_types),
                             None,
                         )
                         if first is None:
                             # Empty line, or nothing but INDENT/DEDENT tokens.
                             continue
                         if first.string in ESCAPE_SINGLES:
                             return cls(first.start)
                     return None

                 def transform(self, lines):
                     """Transform an escaped line found by the ``find()`` classmethod.

                     The (possibly backslash-continued) line is split into its escape
                     prefix and the remaining content, and replaced by the code the
                     matching entry of ``tr`` generates. An escape with no entry in
                     ``tr`` yields an empty call. The indentation before the escape is
                     preserved. Returns the new list of lines.
                     """
                     row, col = self.start_line, self.start_col
                     indent = lines[row][:col]
                     end_line = find_end_of_continued_line(lines, row)
                     line = assemble_continued_line(lines, (row, col), end_line)

                     # Two-character escapes ('!!', '??') take precedence over the
                     # one-character form.
                     prefix_len = 2 if (len(line) > 1 and line[:2] in ESCAPE_DOUBLES) else 1
                     escape, content = line[:prefix_len], line[prefix_len:]

                     handler = tr.get(escape)
                     call = handler(content) if handler is not None else ''

                     return lines[:row] + [indent + call + '\n'] + lines[end_line + 1:]
             # Matches a help request at the end of the text: up to two leading '%',
             # a dotted name whose parts may contain '*' but cannot start with a digit,
             # then '?' or '??'. Group 1 is the target, group 3 the question mark(s).
             _help_end_re = re.compile(r"""(%{0,2}
                                           (?!\d)[\w*]+            # Variable name
                                           (\.(?!\d)[\w*]+)*       # .etc.etc
                                           )
                                           (\?\??)$                # ? or ??
                                           """,
                                           re.VERBOSE)
             class HelpEnd(TokenTransformBase):
                 """Transformer for help syntax: obj? and obj??"""
                 # This needs to be higher priority (lower number) than EscapedCommand so
                 # that inspecting magics (%foo?) works.
                 priority = 5

                 def __init__(self, start, q_locn):
                     super().__init__(start)
                     # *q_locn* is the (line, column) of the '?' token, line 1-indexed.
                     q_lineno, self.q_col = q_locn[0], q_locn[1]
                     self.q_line = q_lineno - 1  # Shift from 1-indexed to 0-indexed

                 @classmethod
                 def find(cls, tokens_by_line):
                     """Find the first help command (foo?) in the cell.

                     A line qualifies when it has more than two tokens and its
                     last-but-one token is ``?``. Returns an instance recording the
                     first token that is not INDENT/DEDENT and the ``?`` token, or None.
                     """
                     layout_types = (tokenize.INDENT, tokenize.DEDENT)
                     for line in tokens_by_line:
                         # Last token is NEWLINE; look at last but one
                         if len(line) <= 2 or line[-2].string != '?':
                             continue
                         first = next(tok for tok in line if tok.type not in layout_types)
                         return cls(first.start, line[-2].start)
                     return None

                 def transform(self, lines):
                     """Transform a help command found by the ``find()`` classmethod.

                     The lines from the start of the statement through the line holding
                     the ``?`` are replaced by one line containing the help call.

                     Raises
                     ------
                     SyntaxError
                         If the text does not end in a recognisable help target.
                     """
                     first, last = self.start_line, self.q_line
                     piece = ''.join(lines[first:last + 1])
                     indent = piece[:self.start_col]
                     content = piece[self.start_col:]
                     lines_before = lines[:first]
                     lines_after = lines[last + 1:]

                     m = _help_end_re.search(content)
                     if m is None:
                         raise SyntaxError(content)
                     target, esc = m.group(1), m.group(3)

                     # If we're mid-command, put it back on the next prompt for the user.
                     whole_cell = (not lines_before) and (not lines_after)
                     if whole_cell and content.strip() != m.group(0):
                         next_input = content.rstrip('?\n')
                     else:
                         next_input = None

                     call = _make_help_call(target, esc, next_input=next_input)
                     return lines_before + [indent + call + '\n'] + lines_after
             def make_tokens_by_line(lines:List[str]):
                 """Tokenize a series of lines and group the tokens by logical line.

                 The tokens of a multiline Python string or bracketed expression are
                 kept together as one line. Every line except possibly the last should
                 keep its line ending for this to work properly; for example, split a
                 block of text with ``str.splitlines(keepends=True)`` before passing it
                 in.

                 Returns a list of lists of tokens. Tokenizing errors caused by input
                 that ends inside a multiline string or expression are ignored, and
                 the tokens produced up to that point are returned.
                 """
                 # NL tokens are used inside multiline expressions, but also after blank
                 # lines or comments. This is intentional - see https://bugs.python.org/issue17061
                 # We want to group the former case together but split the latter, so we
                 # track the bracket nesting depth, similar to the internals of tokenize.
                 #   reexported from token on 3.7+
                 NEWLINE, NL = tokenize.NEWLINE, tokenize.NL  # type: ignore
                 line_endings = ('\n', '\r', '\r\n', '\x0b', '\x0c')
                 if len(lines) > 1 and not lines[0].endswith(line_endings):
                     warnings.warn("`make_tokens_by_line` received a list of lines which do not have lineending markers ('\\n', '\\r', '\\r\\n', '\\x0b', '\\x0c'), behavior will be unspecified")
                 grouped: List[List[Any]] = [[]]
                 depth = 0
                 try:
                     for tok in tokenize.generate_tokens(iter(lines).__next__):
                         grouped[-1].append(tok)
                         ends_group = (tok.type == NEWLINE) or (tok.type == NL and depth <= 0)
                         if ends_group:
                             grouped.append([])
                         elif tok.string in {'(', '[', '{'}:
                             depth += 1
                         elif tok.string in {')', ']', '}'} and depth > 0:
                             depth -= 1
                 except tokenize.TokenError:
                     # Input ended in a multiline string or expression. That's OK for us.
                     pass
                 if not grouped[-1]:
                     # Drop the empty group opened after the final line break.
                     grouped.pop()
                 return grouped
             def show_linewise_tokens(s: str):
                 """For investigation and debugging.

                 Prints the tokens of *s* grouped by logical line, with a
                 ``Line -------`` header before each group. A trailing newline is
                 added to *s* first if it lacks one.
                 """
                 text = s if s.endswith('\n') else s + '\n'
                 for token_line in make_tokens_by_line(text.splitlines(keepends=True)):
                     print("Line -------")
                     for tok in token_line:
                         print(" ", tok)
             # Arbitrary limit to prevent getting stuck in infinite loops: the maximum
             # number of token-transform passes run over one cell before giving up.
             TRANSFORM_LOOP_LIMIT = 500
             class TransformerManager:
                 """Applies various transformations to a cell or code block.
                 The key methods for external use are ``transform_cell()``
                 and ``check_complete()``.
                 """
                 def __init__(self):
                     # Callables taking and returning a list of lines; applied first,
                     # in this order.
                     self.cleanup_transforms = [
                         leading_empty_lines,
                         leading_indent,
                         classic_prompt,
                         ipython_prompt,
                     ]
                     # Callables taking and returning a list of lines; applied after
                     # the cleanup transforms.
                     self.line_transforms = [
                         cell_magic,
                     ]
                     # Classes whose find() classmethod is tried against the tokenized
                     # cell to locate special syntax.
                     self.token_transformers = [
                         MagicAssign,
                         SystemAssign,
                         EscapedCommand,
                         HelpEnd,
                     ]
                 def do_one_token_transform(self, lines):
                     """Find and run the transform earliest in the code.

                     Returns (changed, lines).

                     Callers invoke this repeatedly until changed is False, which
                     signals that no transformation applies any more.

                     Tokens following IPython special syntax might not be valid, so
                     the code is retokenised on every call to locate the next piece of
                     special syntax. Hopefully long code cells are mostly valid Python,
                     not using lots of IPython special syntax, so this shouldn't be a
                     performance issue.
                     """
                     tokens_by_line = make_tokens_by_line(lines)
                     matches = (cls.find(tokens_by_line) for cls in self.token_transformers)
                     candidates = [found for found in matches if found]
                     if not candidates:
                         # Nothing to transform
                         return False, lines
                     candidates.sort(key=TokenTransformBase.sortby)
                     for transformer in candidates:
                         try:
                             transformed = transformer.transform(lines)
                         except SyntaxError:
                             # This match could not be transformed; try the next one.
                             continue
                         return True, transformed
                     return False, lines
                 def do_token_transforms(self, lines):
                     """Apply token transforms repeatedly until nothing changes.

                     Returns the transformed lines.

                     Raises
                     ------
                     RuntimeError
                         If the lines are still changing after TRANSFORM_LOOP_LIMIT
                         passes.
                     """
                     passes_left = TRANSFORM_LOOP_LIMIT
                     while passes_left > 0:
                         passes_left -= 1
                         changed, lines = self.do_one_token_transform(lines)
                         if not changed:
                             return lines
                     raise RuntimeError("Input transformation still changing after "
                                        "%d iterations. Aborting." % TRANSFORM_LOOP_LIMIT)
                 def transform_cell(self, cell: str) -> str:
                     """Transforms a cell of input code.

                     The cell is given a trailing newline if it lacks one, split into
                     lines, passed through the cleanup and line transforms in order,
                     then through the token transforms, and joined back into a string.
                     """
                     text = cell if cell.endswith('\n') else cell + '\n'
                     lines = text.splitlines(keepends=True)
                     for step in self.cleanup_transforms + self.line_transforms:
                         lines = step(lines)
                     return ''.join(self.do_token_transforms(lines))
                 def check_complete(self, cell: str):
                     """Return whether a block of code is ready to execute, or should be continued
                     Parameters
                     ----------
                     source : string
                       Python input code, which can be multiline.
                     Returns
                     -------
                     status : str
                       One of 'complete', 'incomplete', or 'invalid' if source is not a
                       prefix of valid code.
                     indent_spaces : int or None
                       The number of spaces by which to indent the next line of code. If
                       status is not 'incomplete', this is None.
                     """
                     # Remember if the lines ends in a new line.
                     ends_with_newline = False
                     for character in reversed(cell):
                         if character == '\n':
                             ends_with_newline = True
                             break
                         elif character.strip():
                             break
                         else:
                             continue
                     if not ends_with_newline:
                         # Append an newline for consistent tokenization
                         # See https://bugs.python.org/issue33899
                         cell += '\n'
                     lines = cell.splitlines(keepends=True)
                     if not lines:
                         return 'complete', None
                     if lines[-1].endswith('\\'):
                         # Explicit backslash continuation
                         return 'incomplete', find_last_indent(lines)
                     try:
                         for transform in self.cleanup_transforms:
                             if not getattr(transform, 'has_side_effects', False):
                                 lines = transform(lines)
                     except SyntaxError:
                         return 'invalid', None
                     if lines[0].startswith('%%'):
                         # Special case for cell magics - completion marked by blank line
                         if lines[-1].strip():
                             return 'incomplete', find_last_indent(lines)
                         else:
                             return 'complete', None
                     try:
                         for transform in self.line_transforms:
                             if not getattr(transform, 'has_side_effects', False):
                                 lines = transform(lines)
                         lines = self.do_token_transforms(lines)
                     except SyntaxError:
                         return 'invalid', None
                     tokens_by_line = make_tokens_by_line(lines)
                     if not tokens_by_line:
                         return 'incomplete', find_last_indent(lines)
                     if tokens_by_line[-1][-1].type != tokenize.ENDMARKER:
                         # We're in a multiline string or expression
                         return 'incomplete', find_last_indent(lines)
                     newline_types = {tokenize.NEWLINE, tokenize.COMMENT, tokenize.ENDMARKER} # type: ignore
                     # Pop the last line which only contains DEDENTs and ENDMARKER
                     last_token_line = None
                     if {t.type for t in tokens_by_line[-1]} in [
                         {tokenize.DEDENT, tokenize.ENDMARKER},
                         {tokenize.ENDMARKER}
                     ] and len(tokens_by_line) > 1:
                         last_token_line = tokens_by_line.pop()
                     while tokens_by_line[-1] and tokens_by_line[-1][-1].type in newline_types:
                         tokens_by_line[-1].pop()
                     if not tokens_by_line[-1]:
                         return 'incomplete', find_last_indent(lines)
                     if tokens_by_line[-1][-1].string == ':':
                         # The last line starts a block (e.g. 'if foo:')
                         ix = 0
                         while tokens_by_line[-1][ix].type in {tokenize.INDENT, tokenize.DEDENT}:
                             ix += 1
                         indent = tokens_by_line[-1][ix].start[1]
                         return 'incomplete', indent + 4
                     if tokens_by_line[-1][0].line.endswith('\\'):
                         return 'incomplete', None
                     # At this point, our checks think the code is complete (or invalid).
                     # We'll use codeop.compile_command to check this with the real parser
                     try:
                         with warnings.catch_warnings():
                             warnings.simplefilter('error', SyntaxWarning)
                             res = compile_command(''.join(lines), symbol='exec')
                     except (SyntaxError, OverflowError, ValueError, TypeError,
                             MemoryError, SyntaxWarning):
                         return 'invalid', None
                     else:
                         if res is None:
                             return 'incomplete', find_last_indent(lines)
                     if last_token_line and last_token_line[0].type == tokenize.DEDENT:
                         if ends_with_newline:
                             return 'complete', None
                         return 'incomplete', find_last_indent(lines)
                     # If there's a blank line at the end, assume we're ready to execute
                     if not lines[-1].strip():
                         return 'complete', None
                     return 'complete', None
             def find_last_indent(lines):
                 """Return the indentation width of the last line in ``lines``.

                 The leading run of spaces and tabs of ``lines[-1]`` is measured, with
                 each tab counted as four spaces.

                 Parameters
                 ----------
                 lines : list of str
                     Source lines; only the last one is inspected.

                 Returns
                 -------
                 int
                     Width of the leading whitespace, or 0 when ``lines`` is empty or
                     the last line does not start with a space or tab.
                 """
                 if not lines:
                     # Nothing to measure; avoid an IndexError on lines[-1].
                     return 0
                 m = _indent_re.match(lines[-1])
                 if not m:
                     return 0
                 # Each tab counts as a fixed four columns, not as a tab stop.
                 return len(m.group(0).replace('\t', ' '*4))