upstream/ipython Commit - r26495:40a57d40

"""Input transformer machinery to support IPython special syntax.

This includes the machinery to recognise and transform ``%magic`` commands,
``!system`` commands, ``help?`` querying, prompt stripping, and so forth.

Added: IPython 7.0. Replaces inputsplitter and inputtransformer which were
deprecated in 7.0.
"""

# Copyright (c) IPython Development Team.
# Distributed under the terms of the Modified BSD License.

12

13

from codeop import compile_command

13

from codeop import compile_command

14

import re

14

import re

15

import tokenize

15

import tokenize

16

from typing import List, Tuple, Optional, Any

16

from typing import List, Tuple, Optional, Any

17

import warnings

17

import warnings

18

19

# Matches the run of spaces and/or tabs at the very start of a line.
_indent_re = re.compile(r'^[ \t]+')

20

21

def leading_empty_lines(lines):
    """Remove leading empty lines

    If the leading lines are empty or contain only whitespace, they will be
    removed.

    Parameters
    ----------
    lines : list of str
        The lines of a cell.

    Returns
    -------
    list of str
        ``lines`` from the first non-blank line onwards.  If *every* line is
        blank (or ``lines`` is empty) the input is returned unchanged.
    """
    if not lines:
        return lines
    for i, line in enumerate(lines):
        # A line counts as non-blank once it has any non-whitespace character.
        if line and not line.isspace():
            return lines[i:]
    return lines

33

34

def leading_indent(lines):
    """Remove leading indentation.

    If the first line starts with spaces or tabs, the same whitespace will be
    removed from each following line in the cell.

    Parameters
    ----------
    lines : list of str
        The lines of a cell.

    Returns
    -------
    list of str
        The lines with the first line's indentation prefix removed from every
        line that starts with exactly that prefix; other lines are untouched.
        The input is returned unchanged when it is empty or the first line is
        not indented.
    """
    if not lines:
        return lines
    first = lines[0]
    # Length of the leading run of spaces/tabs on the first line.
    n = len(first) - len(first.lstrip(' \t'))
    if not n:
        return lines
    space = first[:n]
    return [line[n:] if line.startswith(space) else line
            for line in lines]

49

50

class PromptStripper:
    """Remove matching input prompts from a block of input.

    Parameters
    ----------
    prompt_re : regular expression
        A regular expression matching any input prompt (including continuation,
        e.g. ``...``)
    initial_re : regular expression, optional
        A regular expression matching only the initial prompt, but not continuation.
        If no initial expression is given, prompt_re will be used everywhere.
        Used mainly for plain Python prompts (``>>>``), where the continuation prompt
        ``...`` is a valid Python expression in Python 3, so shouldn't be stripped.

    Notes
    -----

    If initial_re and prompt_re differ,
    only initial_re will be tested against the first line.
    If any prompt is found on the first two lines,
    prompts will be stripped from the rest of the block.
    """
    def __init__(self, prompt_re, initial_re=None):
        self.prompt_re = prompt_re
        self.initial_re = initial_re or prompt_re

    def _strip(self, lines):
        """Return *lines* with at most one ``prompt_re`` match removed per line."""
        return [self.prompt_re.sub('', l, count=1) for l in lines]

    def __call__(self, lines):
        """Strip prompts from *lines* if the first or second line has one.

        Returns the input list unchanged when it is empty or no prompt is
        detected on the first two lines.
        """
        if not lines:
            return lines
        if self.initial_re.match(lines[0]) or \
                (len(lines) > 1 and self.prompt_re.match(lines[1])):
            return self._strip(lines)
        return lines

86

87

# Strips plain Python REPL prompts.  Only ``>>>`` is accepted as the initial
# prompt, because a bare ``...`` on the first line is valid Python (Ellipsis).
classic_prompt = PromptStripper(
    prompt_re=re.compile(r'^(>>>|\.\.\.)( |$)'),
    initial_re=re.compile(r'^>>>( |$)')
)

91

92

# Strips IPython-style prompts (``In [N]: `` and the ``...:`` continuation).
ipython_prompt = PromptStripper(
    re.compile(
        r"""
        ^(                         # Match from the beginning of a line, either:

                                   # 1. First-line prompt:
        ((\[nav\]|\[ins\])?\ )?    # Vi editing mode prompt, if it's there
        In\                        # The 'In' of the prompt, with a space
        \[\d+\]:                   # Command index, as displayed in the prompt
        \                          # With a mandatory trailing space

        |                          # ... or ...

                                   # 2. The three dots of the multiline prompt
        \s*                        # All leading whitespace characters
        \.{3,}:                    # The three (or more) dots
        \ ?                        # With an optional trailing space

        )
        """,
        re.VERBOSE,
    )
)

115

116

117

def cell_magic(lines):
    """Turn a ``%%magic`` cell into a single ``run_cell_magic`` call.

    Parameters
    ----------
    lines : list of str
        The lines of a cell.

    Returns
    -------
    list of str
        The input unchanged if it is empty, does not start with ``%%``, or is
        a help request such as ``%%name?``.  Otherwise a one-element list
        holding the ``get_ipython().run_cell_magic(name, first_line, body)``
        source line, where *body* is all lines after the first joined together.
    """
    if not lines or not lines[0].startswith('%%'):
        return lines
    if re.match(r'%%\w+\?', lines[0]):
        # This case will be handled by help_end
        return lines
    magic_name, _, first_line = lines[0][2:].rstrip().partition(' ')
    body = ''.join(lines[1:])
    return ['get_ipython().run_cell_magic(%r, %r, %r)\n'
            % (magic_name, first_line, body)]

127

128

129

def _find_assign_op(token_line) -> Optional[int]:
    """Get the index of the first assignment in the line ('=' not inside brackets)

    Note: We don't try to support multiple special assignment (a = b = %foo)

    Parameters
    ----------
    token_line : sequence of tokens
        Tokens for one logical line; only each token's ``string`` attribute
        is inspected.

    Returns
    -------
    int or None
        Index of the first ``=`` token found at bracket depth zero, or None
        if there is none.
    """
    paren_level = 0
    for i, ti in enumerate(token_line):
        s = ti.string
        if s == '=' and paren_level == 0:
            return i
        if s in {'(', '[', '{'}:
            paren_level += 1
        elif s in {')', ']', '}'}:
            # Never go negative on unbalanced closing brackets.
            if paren_level > 0:
                paren_level -= 1
    return None

145

146

def find_end_of_continued_line(lines, start_line: int):
    """Find the last line of a line explicitly extended using backslashes.

    Uses 0-indexed line numbers.

    Parameters
    ----------
    lines : list of str
        Physical lines, each expected to keep its trailing newline.
    start_line : int
        Index of the line where the (possibly continued) statement starts.

    Returns
    -------
    int
        Index of the first line at or after *start_line* that does not end in
        a backslash followed by a newline.  If every remaining line is
        continued, ``len(lines)`` is returned, which is one past the last
        valid index.
    """
    end_line = start_line
    while lines[end_line].endswith('\\\n'):
        end_line += 1
        # Ran off the end: the final line itself ends with a continuation.
        if end_line >= len(lines):
            break
    return end_line

157

158

def assemble_continued_line(lines, start: Tuple[int, int], end_line: int):
    r"""Assemble a single line from multiple continued line pieces

    Continued lines are lines ending in ``\``, and the line following the last
    ``\`` in the block.

    For example, this code continues over multiple lines::

        if (assign_ix is not None) \
             and (len(line) >= assign_ix + 2) \
             and (line[assign_ix+1].string == '%') \
             and (line[assign_ix+2].type == tokenize.NAME):

    This statement contains four continued line pieces.
    Assembling these pieces into a single line would give::

        if (assign_ix is not None) and (len(line) >= assign_ix + 2) and (line[...

    This uses 0-indexed line numbers. *start* is (lineno, colno).

    Used to allow ``%magic`` and ``!system`` commands to be continued over
    multiple lines.

    Returns
    -------
    str
        The pieces joined with single spaces.  Every piece but the last has
        trailing whitespace and its final character (the backslash) removed;
        the last piece only has trailing whitespace removed.
    """
    parts = [lines[start[0]][start[1]:]] + lines[start[0]+1:end_line+1]
    return ' '.join([p.rstrip()[:-1] for p in parts[:-1]]  # Strip backslash+newline
                    + [parts[-1].rstrip()])                # Strip newline from last line

184

185

class TokenTransformBase:
    """Base class for transformations which examine tokens.

    Special syntax should not be transformed when it occurs inside strings or
    comments. This is hard to reliably avoid with regexes. The solution is to
    tokenise the code as Python, and recognise the special syntax in the tokens.

    IPython's special syntax is not valid Python syntax, so tokenising may go
    wrong after the special syntax starts. These classes therefore find and
    transform *one* instance of special syntax at a time into regular Python
    syntax. After each transformation, tokens are regenerated to find the next
    piece of special syntax.

    Subclasses need to implement one class method (find)
    and one regular method (transform).

    The priority attribute can select which transformation to apply if multiple
    transformers match in the same place. Lower numbers have higher priority.
    This allows "%magic?" to be turned into a help call rather than a magic call.
    """
    # Lower numbers -> higher priority (for matches in the same location)
    priority = 10

    def sortby(self):
        """Return the sort key ``(start_line, start_col, priority)``."""
        return self.start_line, self.start_col, self.priority

    def __init__(self, start):
        """Record the match position; *start* is a 1-indexed (line, col) pair."""
        self.start_line = start[0] - 1   # Shift from 1-index to 0-index
        self.start_col = start[1]

    @classmethod
    def find(cls, tokens_by_line):
        """Find one instance of special syntax in the provided tokens.

        Tokens are grouped into logical lines for convenience,
        so it is easy to e.g. look at the first token of each line.
        *tokens_by_line* is a list of lists of tokenize.TokenInfo objects.

        This should return an instance of its class, pointing to the start
        position it has found, or None if it found no match.
        """
        raise NotImplementedError

    def transform(self, lines: List[str]):
        """Transform one instance of special syntax found by ``find()``

        Takes a list of strings representing physical lines,
        returns a similar list of transformed lines.
        """
        raise NotImplementedError

235

236

class MagicAssign(TokenTransformBase):
    """Transformer for assignments from magics (a = %foo)"""
    @classmethod
    def find(cls, tokens_by_line):
        """Find the first magic assignment (a = %foo) in the cell.

        Returns an instance pointing at the ``%`` token, or None if no line
        has ``=`` immediately followed by ``%`` and a NAME token.
        """
        for line in tokens_by_line:
            assign_ix = _find_assign_op(line)
            # Two tokens after the '=' are inspected, so the line must be
            # long enough for index assign_ix + 2 to exist.
            if (assign_ix is not None) \
                    and (len(line) > assign_ix + 2) \
                    and (line[assign_ix+1].string == '%') \
                    and (line[assign_ix+2].type == tokenize.NAME):
                return cls(line[assign_ix+1].start)
        return None

    def transform(self, lines: List[str]):
        """Transform a magic assignment found by the ``find()`` classmethod.

        Replaces the (possibly backslash-continued) statement with a single
        line assigning the result of ``get_ipython().run_line_magic(...)``.
        """
        start_line, start_col = self.start_line, self.start_col
        lhs = lines[start_line][:start_col]
        end_line = find_end_of_continued_line(lines, start_line)
        rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
        assert rhs.startswith('%'), rhs
        magic_name, _, args = rhs[1:].partition(' ')

        lines_before = lines[:start_line]
        call = "get_ipython().run_line_magic({!r}, {!r})".format(magic_name, args)
        new_line = lhs + call + '\n'
        lines_after = lines[end_line+1:]

        return lines_before + [new_line] + lines_after

266

267

268

class SystemAssign(TokenTransformBase):
    """Transformer for assignments from system commands (a = !foo)"""
    @classmethod
    def find(cls, tokens_by_line):
        """Find the first system assignment (a = !foo) in the cell.

        Returns an instance pointing at the ``!`` token, or None if no
        matching line is found.
        """
        for line in tokens_by_line:
            assign_ix = _find_assign_op(line)
            # Skip lines whose text begins with '=' and require the token
            # after '=' to be an ERRORTOKEN.
            if (assign_ix is not None) \
                    and not line[assign_ix].line.strip().startswith('=') \
                    and (len(line) >= assign_ix + 2) \
                    and (line[assign_ix + 1].type == tokenize.ERRORTOKEN):
                ix = assign_ix + 1

                # Walk the run of ERRORTOKENs: whitespace-only ones are
                # skipped, '!' is the match, anything else ends the search
                # on this line.
                while ix < len(line) and line[ix].type == tokenize.ERRORTOKEN:
                    if line[ix].string == '!':
                        return cls(line[ix].start)
                    elif not line[ix].string.isspace():
                        break
                    ix += 1
        return None

    def transform(self, lines: List[str]):
        """Transform a system assignment found by the ``find()`` classmethod.

        Replaces the (possibly backslash-continued) statement with a single
        line assigning the result of ``get_ipython().getoutput(cmd)``.
        """
        start_line, start_col = self.start_line, self.start_col

        lhs = lines[start_line][:start_col]
        end_line = find_end_of_continued_line(lines, start_line)
        rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
        assert rhs.startswith('!'), rhs
        cmd = rhs[1:]

        lines_before = lines[:start_line]
        call = "get_ipython().getoutput({!r})".format(cmd)
        new_line = lhs + call + '\n'
        lines_after = lines[end_line + 1:]

        return lines_before + [new_line] + lines_after

306

307

# The escape sequences that define the syntax transformations IPython will
# apply to user input.  These can NOT be just changed here: many regular
# expressions and other parts of the code may use their hardcoded values, and
# for all intents and purposes they constitute the 'IPython syntax', so they
# should be considered fixed.

ESC_SHELL  = '!'     # Send line to underlying system shell
ESC_SH_CAP = '!!'    # Send line to system shell and capture output
ESC_HELP   = '?'     # Find information about object
ESC_HELP2  = '??'    # Find extra-detailed information about object
ESC_MAGIC  = '%'     # Call magic function
ESC_MAGIC2 = '%%'    # Call cell-magic function
ESC_QUOTE  = ','     # Split args on whitespace, quote each as string and call
ESC_QUOTE2 = ';'     # Quote all args as a single string, call
ESC_PAREN  = '/'     # Call first argument with rest of line as arguments

ESCAPE_SINGLES = {'!', '?', '%', ',', ';', '/'}
ESCAPE_DOUBLES = {'!!', '??'}  # %% (cell magic) is handled separately

325

326

def _make_help_call(target, esc, next_input=None):
    """Prepares a pinfo(2)/psearch call from a target name and the escape
    (i.e. ? or ??)

    Parameters
    ----------
    target : str
        The name (or ``*`` wildcard pattern) to look up.
    esc : str
        ``'??'`` selects ``pinfo2``; any other value selects ``psearch`` when
        *target* contains ``*`` and ``pinfo`` otherwise.
    next_input : str, optional
        If given, the generated code first calls
        ``get_ipython().set_next_input(next_input)``.

    Returns
    -------
    str
        Source code calling ``get_ipython().run_line_magic(method, target)``.
    """
    if esc == '??':
        method = 'pinfo2'
    elif '*' in target:
        method = 'psearch'
    else:
        method = 'pinfo'
    # method and target are passed straight through as the magic name and
    # argument string of get_ipython().run_line_magic(magic_name, magic_args).
    if next_input is None:
        return 'get_ipython().run_line_magic(%r, %r)' % (method, target)
    else:
        return 'get_ipython().set_next_input(%r);get_ipython().run_line_magic(%r, %r)' % \
            (next_input, method, target)

341

342

def _tr_help(content):
    """Translate lines escaped with: ?

    A naked help line should fire the intro help screen (shell.show_usage())
    """
    if not content:
        return 'get_ipython().show_usage()'

    return _make_help_call(content, '?')

351

352

def _tr_help2(content):
    """Translate lines escaped with: ??

    A naked help line should fire the intro help screen (shell.show_usage())
    """
    if not content:
        return 'get_ipython().show_usage()'

    return _make_help_call(content, '??')

361

362

def _tr_magic(content):
    """Translate lines escaped with a percent sign: %

    The text before the first space is the magic name; everything after it
    is passed as the argument string.
    """
    name, _, args = content.partition(' ')
    return 'get_ipython().run_line_magic(%r, %r)' % (name, args)

366

367

def _tr_quote(content):
    """Translate lines escaped with a comma: ,

    The first word is the callable; every remaining whitespace-separated
    word becomes its own double-quoted string argument.
    """
    name, _, args = content.partition(' ')
    return '%s("%s")' % (name, '", "'.join(args.split()))

371

372

def _tr_quote2(content):
    """Translate lines escaped with a semicolon: ;

    The first word is the callable; the whole rest of the line becomes one
    double-quoted string argument.
    """
    name, _, args = content.partition(' ')
    return '%s("%s")' % (name, args)

376

377

def _tr_paren(content):
    """Translate lines escaped with a slash: /

    The first word is the callable; the remaining whitespace-separated words
    are passed, unquoted, as comma-separated arguments.
    """
    name, _, args = content.partition(' ')
    return '%s(%s)' % (name, ", ".join(args.split()))

381

382

# Maps each escape sequence to a callable that takes the rest of the line
# and returns the replacement Python source.
tr = { ESC_SHELL  : 'get_ipython().system({!r})'.format,
       ESC_SH_CAP : 'get_ipython().getoutput({!r})'.format,
       ESC_HELP   : _tr_help,
       ESC_HELP2  : _tr_help2,
       ESC_MAGIC  : _tr_magic,
       ESC_QUOTE  : _tr_quote,
       ESC_QUOTE2 : _tr_quote2,
       ESC_PAREN  : _tr_paren }

390

391

class EscapedCommand(TokenTransformBase):
    """Transformer for escaped commands like %foo, !foo, or /foo"""
    @classmethod
    def find(cls, tokens_by_line):
        """Find the first escaped command (%foo, !foo, etc.) in the cell.

        Returns an instance pointing at the escape token, or None if no line
        starts (after INDENT/DEDENT tokens) with a single-character escape.
        """
        for line in tokens_by_line:
            if not line:
                continue
            ix = 0
            ll = len(line)
            # Skip INDENT/DEDENT tokens to reach the first real token.
            while ll > ix and line[ix].type in {tokenize.INDENT, tokenize.DEDENT}:
                ix += 1
            if ix >= ll:
                continue
            if line[ix].string in ESCAPE_SINGLES:
                return cls(line[ix].start)
        return None

    def transform(self, lines):
        """Transform an escaped line found by the ``find()`` classmethod.

        Replaces the (possibly backslash-continued) command with one line of
        Python produced by the matching entry in ``tr``, keeping the original
        indentation.  An escape with no entry in ``tr`` yields an empty call.
        """
        start_line, start_col = self.start_line, self.start_col

        indent = lines[start_line][:start_col]
        end_line = find_end_of_continued_line(lines, start_line)
        line = assemble_continued_line(lines, (start_line, start_col), end_line)

        # Two-character escapes (!!, ??) take precedence over single ones.
        if len(line) > 1 and line[:2] in ESCAPE_DOUBLES:
            escape, content = line[:2], line[2:]
        else:
            escape, content = line[:1], line[1:]

        if escape in tr:
            call = tr[escape](content)
        else:
            call = ''

        lines_before = lines[:start_line]
        new_line = indent + call + '\n'
        lines_after = lines[end_line + 1:]

        return lines_before + [new_line] + lines_after

433

434

# Matches a trailing help request: an optionally %/%%-prefixed dotted name
# (``*`` wildcards allowed) followed by ? or ?? at the end of the string.
_help_end_re = re.compile(r"""(%{0,2}
                              (?!\d)[\w*]+            # Variable name
                              (\.(?!\d)[\w*]+)*       # .etc.etc
                              )
                              (\?\??)$                # ? or ??
                              """,
                              re.VERBOSE)

441

442

class HelpEnd(TokenTransformBase):

442

class HelpEnd(TokenTransformBase):

443

"""Transformer for help syntax: obj? and obj??"""

443

"""Transformer for help syntax: obj? and obj??"""

444

# This needs to be higher priority (lower number) than EscapedCommand so

444

# This needs to be higher priority (lower number) than EscapedCommand so

445

# that inspecting magics (%foo?) works.

445

# that inspecting magics (%foo?) works.

446

priority = 5

446

priority = 5

447

448

def __init__(self, start, q_locn):

448

def __init__(self, start, q_locn):

449

super().__init__(start)

449

super().__init__(start)

450

self.q_line = q_locn[0] - 1 # Shift from 1-indexed to 0-indexed

450

self.q_line = q_locn[0] - 1 # Shift from 1-indexed to 0-indexed

451

self.q_col = q_locn[1]

451

self.q_col = q_locn[1]

452

453

@classmethod

453

@classmethod

454

def find(cls, tokens_by_line):

454

def find(cls, tokens_by_line):

455

"""Find the first help command (foo?) in the cell.

455

"""Find the first help command (foo?) in the cell.

456

"""

456

"""

457

for line in tokens_by_line:

457

for line in tokens_by_line:

458

# Last token is NEWLINE; look at last but one

458

# Last token is NEWLINE; look at last but one

459

if len(line) > 2 and line[-2].string == '?':

459

if len(line) > 2 and line[-2].string == '?':

460

# Find the first token that's not INDENT/DEDENT

460

# Find the first token that's not INDENT/DEDENT

461

ix = 0

461

ix = 0

462

while line[ix].type in {tokenize.INDENT, tokenize.DEDENT}:

462

while line[ix].type in {tokenize.INDENT, tokenize.DEDENT}:

463

ix += 1

463

ix += 1

464

return cls(line[ix].start, line[-2].start)

464

return cls(line[ix].start, line[-2].start)

465

466

def transform(self, lines):

466

def transform(self, lines):

467

"""Transform a help command found by the ``find()`` classmethod.

467

"""Transform a help command found by the ``find()`` classmethod.

468

"""

468

"""

469

piece = ''.join(lines[self.start_line:self.q_line+1])

469

piece = ''.join(lines[self.start_line:self.q_line+1])

470

indent, content = piece[:self.start_col], piece[self.start_col:]

470

indent, content = piece[:self.start_col], piece[self.start_col:]

471

lines_before = lines[:self.start_line]

471

lines_before = lines[:self.start_line]

472

lines_after = lines[self.q_line + 1:]

472

lines_after = lines[self.q_line + 1:]

473

474

m = _help_end_re.search(content)

474

m = _help_end_re.search(content)

475

if not m:

475

if not m:

476

raise SyntaxError(content)

476

raise SyntaxError(content)

477

assert m is not None, content

477

assert m is not None, content

478

target = m.group(1)

478

target = m.group(1)

479

esc = m.group(3)

479

esc = m.group(3)

480

481

# If we're mid-command, put it back on the next prompt for the user.

481

# If we're mid-command, put it back on the next prompt for the user.

482

next_input = None

482

next_input = None

483

if (not lines_before) and (not lines_after) \

483

if (not lines_before) and (not lines_after) \

484

and content.strip() != m.group(0):

484

and content.strip() != m.group(0):

485

next_input = content.rstrip('?\n')

485

next_input = content.rstrip('?\n')

486

487

call = _make_help_call(target, esc, next_input=next_input)

487

call = _make_help_call(target, esc, next_input=next_input)

488

new_line = indent + call + '\n'

488

new_line = indent + call + '\n'

489

490

return lines_before + [new_line] + lines_after

490

return lines_before + [new_line] + lines_after

491

492

def make_tokens_by_line(lines:List[str]):
    """Tokenize a series of lines and group tokens by line.

    The tokens for a multiline Python string or expression are grouped as one
    line. All lines except the last lines should keep their line ending ('\\n',
    '\\r\\n') for this to properly work. Use `.splitlines(keepends=True)`
    for example when passing block of text to this function.

    Returns a list of token lists. If tokenizing stops early because the
    input ends inside a multiline string or expression, the tokens collected
    up to that point are returned.
    """
    # NL tokens are used inside multiline expressions, but also after blank
    # lines or comments. This is intentional - see https://bugs.python.org/issue17061
    # We want to group the former case together but split the latter, so we
    # track parentheses level, similar to the internals of tokenize.

    # reexported from token on 3.7+
    NEWLINE, NL = tokenize.NEWLINE, tokenize.NL  # type: ignore
    tokens_by_line:List[List[Any]] = [[]]
    if len(lines) > 1 and not lines[0].endswith(('\n', '\r', '\r\n', '\x0b', '\x0c')):
        warnings.warn("`make_tokens_by_line` received a list of lines which do not have lineending markers ('\\n', '\\r', '\\r\\n', '\\x0b', '\\x0c'), behavior will be unspecified")
    parenlev = 0
    try:
        for token in tokenize.generate_tokens(iter(lines).__next__):
            tokens_by_line[-1].append(token)
            if (token.type == NEWLINE) \
                    or ((token.type == NL) and (parenlev <= 0)):
                # End of a logical line (or a blank/comment line outside of
                # any bracket): start a new group.
                tokens_by_line.append([])
            elif token.string in {'(', '[', '{'}:
                parenlev += 1
            elif token.string in {')', ']', '}'}:
                # Never let the level go negative on unbalanced closers.
                if parenlev > 0:
                    parenlev -= 1
    except tokenize.TokenError:
        # Input ended in a multiline string or expression. That's OK for us.
        pass

    # Drop the empty group opened after the final NEWLINE/NL, if any.
    if not tokens_by_line[-1]:
        tokens_by_line.pop()

    return tokens_by_line

533

534

535

def has_sunken_brackets(tokens: List[tokenize.TokenInfo]):
    """Check if the depth of brackets in the list of tokens drops below 0

    Returns True as soon as a closing bracket is seen with no matching
    opening bracket before it, and False if that never happens. Only the
    ``string`` attribute of each token is inspected, and the three bracket
    kinds are counted together (``(]`` is treated as balanced).
    """
    parenlev = 0
    for token in tokens:
        if token.string in {"(", "[", "{"}:
            parenlev += 1
        elif token.string in {")", "]", "}"}:
            parenlev -= 1
            if parenlev < 0:
                return True
    return False

546

547

548

def show_linewise_tokens(s: str):
    """For investigation and debugging

    Prints the tokens of ``s`` grouped the way ``make_tokens_by_line`` groups
    them, one ``Line -------`` header per group. A trailing newline is added
    to ``s`` first if it does not already end with one.
    """
    if not s.endswith('\n'):
        s += '\n'
    lines = s.splitlines(keepends=True)
    for line in make_tokens_by_line(lines):
        print("Line -------")
        for tokinfo in line:
            print(" ", tokinfo)

557

558

# Arbitrary limit to prevent getting stuck in infinite loops
TRANSFORM_LOOP_LIMIT = 500


class TransformerManager:
    """Applies various transformations to a cell or code block.

    The key methods for external use are ``transform_cell()``
    and ``check_complete()``.
    """
    def __init__(self):
        # Applied first, in order, to the list of lines of a cell.
        self.cleanup_transforms = [
            leading_empty_lines,
            leading_indent,
            classic_prompt,
            ipython_prompt,
        ]
        # Applied after the cleanup transforms, also to the list of lines.
        self.line_transforms = [
            cell_magic,
        ]
        # Classes offering a ``find(tokens_by_line)`` classmethod; the
        # instances it returns are asked to ``transform(lines)``.
        self.token_transformers = [
            MagicAssign,
            SystemAssign,
            EscapedCommand,
            HelpEnd,
        ]

    def do_one_token_transform(self, lines):
        """Find and run the transform earliest in the code.

        Returns (changed, lines).

        This method is called repeatedly until changed is False, indicating
        that all available transformations are complete.

        The tokens following IPython special syntax might not be valid, so
        the transformed code is retokenised every time to identify the next
        piece of special syntax. Hopefully long code cells are mostly valid
        Python, not using lots of IPython special syntax, so this shouldn't be
        a performance issue.
        """
        tokens_by_line = make_tokens_by_line(lines)
        candidates = []
        for transformer_cls in self.token_transformers:
            transformer = transformer_cls.find(tokens_by_line)
            if transformer:
                candidates.append(transformer)

        if not candidates:
            # Nothing to transform
            return False, lines
        ordered_transformers = sorted(candidates, key=TokenTransformBase.sortby)
        for transformer in ordered_transformers:
            try:
                return True, transformer.transform(lines)
            except SyntaxError:
                # This candidate could not be applied; try the next one.
                pass
        return False, lines

    def do_token_transforms(self, lines):
        """Apply token transforms repeatedly until nothing changes.

        Raises RuntimeError if the lines are still changing after
        ``TRANSFORM_LOOP_LIMIT`` rounds.
        """
        for _ in range(TRANSFORM_LOOP_LIMIT):
            changed, lines = self.do_one_token_transform(lines)
            if not changed:
                return lines

        raise RuntimeError("Input transformation still changing after "
                           "%d iterations. Aborting." % TRANSFORM_LOOP_LIMIT)

    def transform_cell(self, cell: str) -> str:
        """Transforms a cell of input code"""
        if not cell.endswith('\n'):
            cell += '\n'  # Ensure the cell has a trailing newline
        lines = cell.splitlines(keepends=True)
        for transform in self.cleanup_transforms + self.line_transforms:
            lines = transform(lines)

        lines = self.do_token_transforms(lines)
        return ''.join(lines)

    def check_complete(self, cell: str):
        """Return whether a block of code is ready to execute, or should be continued

        Parameters
        ----------
        cell : string
          Python input code, which can be multiline.

        Returns
        -------
        status : str
          One of 'complete', 'incomplete', or 'invalid' if source is not a
          prefix of valid code.
        indent_spaces : int or None
          The number of spaces by which to indent the next line of code. If
          status is not 'incomplete', this is None.
        """
        # Remember if the lines ends in a new line: scan backwards over the
        # trailing whitespace and stop at the first newline or the first
        # non-whitespace character.
        ends_with_newline = False
        for character in reversed(cell):
            if character == '\n':
                ends_with_newline = True
                break
            elif character.strip():
                break

        if not ends_with_newline:
            # Append a newline for consistent tokenization
            # See https://bugs.python.org/issue33899
            cell += '\n'

        lines = cell.splitlines(keepends=True)

        if not lines:
            return 'complete', None

        if lines[-1].endswith('\\'):
            # Explicit backslash continuation
            return 'incomplete', find_last_indent(lines)

        try:
            for transform in self.cleanup_transforms:
                if not getattr(transform, 'has_side_effects', False):
                    lines = transform(lines)
        except SyntaxError:
            return 'invalid', None

        if lines[0].startswith('%%'):
            # Special case for cell magics - completion marked by blank line
            if lines[-1].strip():
                return 'incomplete', find_last_indent(lines)
            else:
                return 'complete', None

        try:
            for transform in self.line_transforms:
                if not getattr(transform, 'has_side_effects', False):
                    lines = transform(lines)
            lines = self.do_token_transforms(lines)
        except SyntaxError:
            return 'invalid', None

        tokens_by_line = make_tokens_by_line(lines)

        # Bail if we got one line and there are more closing parentheses than
        # the opening ones
        if (
            len(lines) == 1
            and tokens_by_line
            and has_sunken_brackets(tokens_by_line[0])
        ):
            return "invalid", None

        if not tokens_by_line:
            return 'incomplete', find_last_indent(lines)

        if tokens_by_line[-1][-1].type != tokenize.ENDMARKER:
            # We're in a multiline string or expression
            return 'incomplete', find_last_indent(lines)

        newline_types = {tokenize.NEWLINE, tokenize.COMMENT, tokenize.ENDMARKER}  # type: ignore

        # Pop the last line which only contains DEDENTs and ENDMARKER
        last_token_line = None
        if {t.type for t in tokens_by_line[-1]} in [
            {tokenize.DEDENT, tokenize.ENDMARKER},
            {tokenize.ENDMARKER}
        ] and len(tokens_by_line) > 1:
            last_token_line = tokens_by_line.pop()

        # Strip trailing NEWLINE/COMMENT/ENDMARKER tokens so the last
        # remaining token is the last significant one.
        while tokens_by_line[-1] and tokens_by_line[-1][-1].type in newline_types:
            tokens_by_line[-1].pop()

        if not tokens_by_line[-1]:
            return 'incomplete', find_last_indent(lines)

        if tokens_by_line[-1][-1].string == ':':
            # The last line starts a block (e.g. 'if foo:')
            ix = 0
            while tokens_by_line[-1][ix].type in {tokenize.INDENT, tokenize.DEDENT}:
                ix += 1

            indent = tokens_by_line[-1][ix].start[1]
            return 'incomplete', indent + 4

        if tokens_by_line[-1][0].line.endswith('\\'):
            return 'incomplete', None

        # At this point, our checks think the code is complete (or invalid).
        # We'll use codeop.compile_command to check this with the real parser
        try:
            with warnings.catch_warnings():
                warnings.simplefilter('error', SyntaxWarning)
                res = compile_command(''.join(lines), symbol='exec')
        except (SyntaxError, OverflowError, ValueError, TypeError,
                MemoryError, SyntaxWarning):
            return 'invalid', None
        else:
            if res is None:
                return 'incomplete', find_last_indent(lines)

        if last_token_line and last_token_line[0].type == tokenize.DEDENT:
            # The code ends inside an indented block: only treat it as
            # finished when the input ended with a newline.
            if ends_with_newline:
                return 'complete', None
            return 'incomplete', find_last_indent(lines)

        # Whether or not there is a blank line at the end, the code compiled,
        # so assume we're ready to execute.
        return 'complete', None

769

770

771

def find_last_indent(lines):
    """Return the indentation width of the last line in ``lines``.

    Only leading spaces and tabs are counted, and each tab counts as four
    spaces. Returns 0 when the last line has no leading spaces/tabs, or when
    ``lines`` is empty.
    """
    if not lines:
        # Nothing to measure; avoid an IndexError on lines[-1].
        return 0
    last = lines[-1]
    # Leading run of spaces/tabs (same span a ``^[ \t]+`` match would cover).
    leading = last[:len(last) - len(last.lstrip(' \t'))]
    return len(leading.replace('\t', ' '*4))

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             """Input transformer machinery to support IPython special syntax.
             This includes the machinery to recognise and transform ``%magic`` commands,
             ``!system`` commands, ``help?`` querying, prompt stripping, and so forth.
             Added: IPython 7.0. Replaces inputsplitter and inputtransformer which were
             deprecated in 7.0.
             """
             # Copyright (c) IPython Development Team.
             # Distributed under the terms of the Modified BSD License.
             from codeop import compile_command
             import re
             import tokenize
             from typing import List, Tuple, Optional, Any
             import warnings
             # Matches the run of spaces and/or tabs at the very start of a line, i.e.
             # its leading indentation. Does not match lines that start with content.
             _indent_re = re.compile(r'^[ \t]+')
             def leading_empty_lines(lines):
                 """Drop blank lines from the start of a cell.

                 Lines that are empty or contain only whitespace are skipped until the
                 first line with real content; that line and everything after it are
                 returned. If no line has content, the input is returned unchanged.
                 """
                 if not lines:
                     return lines
                 first_content = next(
                     (idx for idx, text in enumerate(lines)
                      if text and not text.isspace()),
                     None,
                 )
                 if first_content is None:
                     return lines
                 return lines[first_content:]
             def leading_indent(lines):
                 """Strip the first line's indentation from the whole cell.

                 If the first line starts with spaces or tabs, that exact whitespace
                 prefix is removed from every line that begins with it. Lines that do
                 not start with the prefix are passed through untouched.
                 """
                 if not lines:
                     return lines
                 match = _indent_re.match(lines[0])
                 if not match:
                     return lines
                 prefix = match.group(0)
                 width = len(prefix)
                 dedented = []
                 for text in lines:
                     dedented.append(text[width:] if text.startswith(prefix) else text)
                 return dedented
             class PromptStripper:
                 """Strip input prompts from the lines of a pasted block.

                 Parameters
                 ----------
                 prompt_re : regular expression
                     Compiled pattern matching any input prompt, including the
                     continuation prompt (e.g. ``...``).
                 initial_re : regular expression, optional
                     Compiled pattern matching only the first-line prompt. When it is
                     omitted, prompt_re is used for the first line as well. This exists
                     mainly for plain Python prompts (``>>>``): the continuation prompt
                     ``...`` is a valid Python 3 expression and so must not be stripped
                     on its own.

                 Notes
                 -----
                 The first line is tested against initial_re and the second line
                 against prompt_re. If either matches, one leading prompt is removed
                 from every line of the block; otherwise the block is returned as is.
                 """

                 def __init__(self, prompt_re, initial_re=None):
                     self.prompt_re = prompt_re
                     self.initial_re = initial_re or prompt_re

                 def _strip(self, lines):
                     # count=1: only the leading prompt of each line is removed.
                     remove_prompt = self.prompt_re.sub
                     return [remove_prompt('', text, count=1) for text in lines]

                 def __call__(self, lines):
                     if not lines:
                         return lines
                     if not self.initial_re.match(lines[0]):
                         # No prompt on the first line: fall back to the second one.
                         if len(lines) < 2 or not self.prompt_re.match(lines[1]):
                             return lines
                     return self._strip(lines)
             # Stripper for plain Python prompts: only ``>>>`` may open a block, while
             # both ``>>>`` and ``...`` are removed once a block is recognised.
             classic_prompt = PromptStripper(
                 initial_re=re.compile(r'^>>>( |$)'),
                 prompt_re=re.compile(r'^(>>>|\.\.\.)( |$)'),
             )
             # Stripper for IPython prompts: ``In [N]: `` (optionally preceded by a vi
             # editing-mode marker) and the ``...:`` continuation prompt. The same
             # pattern is used for the first line and for continuation lines.
             ipython_prompt = PromptStripper(
                 re.compile(
                     r"""
                     ^(                         # Match from the beginning of a line, either:

                                                # 1. First-line prompt:
                     ((\[nav\]|\[ins\])?\ )?    # Vi editing mode prompt, if it's there
                     In\                        # The 'In' of the prompt, with a space
                     \[\d+\]:                   # Command index, as displayed in the prompt
                     \                          # With a mandatory trailing space

                     |                          # ... or ...

                                                # 2. The three dots of the multiline prompt
                     \s*                        # All leading whitespace characters
                     \.{3,}:                    # The three (or more) dots
                     \ ?                        # With an optional trailing space
                     )                          # Close the group opened after '^'
                     """,
                     re.VERBOSE,
                 )
             )
             def cell_magic(lines):
                 """Rewrite a ``%%magic`` cell into a ``run_cell_magic`` call.

                 If the first line starts with ``%%``, the whole cell is replaced by a
                 single line calling ``get_ipython().run_cell_magic(name, line, body)``,
                 where *line* is the rest of the first line and *body* is all remaining
                 lines joined together. Any other input is returned unchanged, as is a
                 ``%%name?`` help request.
                 """
                 if not lines:
                     return lines
                 header = lines[0]
                 if not header.startswith('%%'):
                     return lines
                 if re.match(r'%%\w+\?', header):
                     # Help request on a cell magic: leave it for the help handling.
                     return lines
                 magic_name, _, first_line = header[2:].rstrip().partition(' ')
                 body = ''.join(lines[1:])
                 call = 'get_ipython().run_cell_magic(%r, %r, %r)\n' % (
                     magic_name, first_line, body)
                 return [call]
             def _find_assign_op(token_line) -> Optional[int]:
                 """Get the index of the first assignment in the line ('=' not inside brackets)
                 Note: We don't try to support multiple special assignment (a = b = %foo)
                 """
                 paren_level = 0
                 for i, ti in enumerate(token_line):
                     s = ti.string
                     if s == '=' and paren_level == 0:
                         return i
                     if s in {'(','[','{'}:
                         paren_level += 1
                     elif s in {')', ']', '}'}:
                         if paren_level > 0:
                             paren_level -= 1
                 return None
             def find_end_of_continued_line(lines, start_line: int):
                 """Locate the end of a backslash-continued line.

                 Starting at *start_line* (0-indexed), advance while the current line
                 ends with a backslash followed by a newline, and return the index of
                 the first line that does not.

                 If the last line of *lines* is itself continued, the returned index is
                 ``len(lines)``, i.e. one past the final line.
                 """
                 total = len(lines)
                 cursor = start_line
                 while True:
                     if not lines[cursor].endswith('\\\n'):
                         return cursor
                     cursor += 1
                     if cursor >= total:
                         return cursor
             def assemble_continued_line(lines, start: Tuple[int, int], end_line: int):
                 r"""Join the pieces of a backslash-continued line into one string.

                 The pieces are the text of line ``start[0]`` from column ``start[1]``
                 onwards, followed by every line up to and including *end_line*. Each
                 piece except the last has its trailing whitespace and final character
                 (the ``\``) removed; the last piece only loses trailing whitespace.
                 The pieces are then joined with single spaces.

                 For example, this statement spans four continued pieces::

                     if (assign_ix is not None) \
                          and (len(line) >= assign_ix + 2) \
                          and (line[assign_ix+1].string == '%') \
                          and (line[assign_ix+2].type == tokenize.NAME):

                 and assembling them gives::

                     if (assign_ix is not None) and (len(line) >= assign_ix + 2) and (line[...

                 Line numbers are 0-indexed and *start* is ``(lineno, colno)``. This lets
                 ``%magic`` and ``!system`` commands extend over several lines.
                 """
                 first_row = start[0]
                 first_col = start[1]
                 pieces = [lines[first_row][first_col:]]
                 pieces.extend(lines[first_row + 1:end_line + 1])
                 *continued, final = pieces
                 # Drop the backslash (and the newline after it) from continued pieces.
                 joined = [piece.rstrip()[:-1] for piece in continued]
                 # The final piece has no backslash; only its newline is removed.
                 joined.append(final.rstrip())
                 return ' '.join(joined)
             class TokenTransformBase:
                 """Common base for transformers that work on Python tokens.

                 Special syntax must be left alone inside strings and comments, which is
                 hard to guarantee with regexes. Instead the code is tokenised as Python
                 and the special syntax is recognised in the token stream.

                 Because IPython's special syntax is not valid Python, tokenising may go
                 wrong after the point where it starts. Each transformer therefore
                 handles *one* occurrence at a time, turning it into regular Python;
                 the tokens are regenerated afterwards to look for the next occurrence.

                 Subclasses provide a class method ``find`` and a regular method
                 ``transform``.

                 When several transformers match at the same position, ``priority``
                 decides which is applied: lower numbers win. This is what lets
                 "%magic?" become a help call rather than a magic call.
                 """
                 # Smaller value -> applied first among matches at the same location.
                 priority = 10

                 def sortby(self):
                     """Return the ordering key ``(start_line, start_col, priority)``."""
                     key = (self.start_line, self.start_col, self.priority)
                     return key

                 def __init__(self, start):
                     """Remember where the special syntax begins.

                     *start* is indexed as ``(line, column)``; the line is converted
                     from 1-indexed to 0-indexed, the column is stored as given.
                     """
                     line_number, column = start[0], start[1]
                     self.start_line = line_number - 1
                     self.start_col = column

                 @classmethod
                 def find(cls, tokens_by_line):
                     """Find one instance of special syntax in the provided tokens.

                     *tokens_by_line* is a list of lists of tokenize.TokenInfo objects,
                     grouped into logical lines so that e.g. the first token of each
                     line is easy to inspect.

                     Implementations return an instance of the class pointing at the
                     start position found, or None when nothing matches.
                     """
                     raise NotImplementedError

                 def transform(self, lines: List[str]):
                     """Transform one instance of special syntax found by ``find()``.

                     Receives the physical lines as a list of strings and returns a
                     list of the same kind with the transformation applied.
                     """
                     raise NotImplementedError
             class MagicAssign(TokenTransformBase):
                 """Transformer for assignments from magics (a = %foo)"""
                 @classmethod
                 def find(cls, tokens_by_line):
                     """Find the first magic assignment (a = %foo) in the cell.

                     Returns an instance positioned at the ``%`` token, or None when no
                     logical line has a top-level ``=`` directly followed by ``%`` and
                     a name.
                     """
                     for line in tokens_by_line:
                         assign_ix = _find_assign_op(line)
                         # Two tokens must follow the '=': the '%' and the magic name.
                         # The length check has to be strict so that indexing
                         # line[assign_ix+2] is always in range, even when the token
                         # line stops right after the '%' (tokenizing can be cut short,
                         # e.g. by a trailing backslash at the end of the input).
                         if (assign_ix is not None) \
                                 and (len(line) > assign_ix + 2) \
                                 and (line[assign_ix+1].string == '%') \
                                 and (line[assign_ix+2].type == tokenize.NAME):
                             return cls(line[assign_ix+1].start)
                     return None

                 def transform(self, lines: List[str]):
                     """Transform a magic assignment found by the ``find()`` classmethod.

                     The text before the ``%`` is kept as the left-hand side; the magic
                     (including any backslash-continued lines) is replaced by a
                     ``get_ipython().run_line_magic(name, args)`` call on a single line.
                     """
                     start_line, start_col = self.start_line, self.start_col
                     lhs = lines[start_line][:start_col]
                     end_line = find_end_of_continued_line(lines, start_line)
                     rhs = assemble_continued_line(lines, (start_line, start_col), end_line)
                     assert rhs.startswith('%'), rhs
                     # Everything up to the first space is the magic name.
                     magic_name, _, args = rhs[1:].partition(' ')

                     lines_before = lines[:start_line]
                     call = "get_ipython().run_line_magic({!r}, {!r})".format(magic_name, args)
                     new_line = lhs + call + '\n'
                     lines_after = lines[end_line+1:]

                     return lines_before + [new_line] + lines_after
             class SystemAssign(TokenTransformBase):
                 """Transformer for assignments from system commands (a = !foo)"""

                 @classmethod
                 def find(cls, tokens_by_line):
                     """Find the first system assignment (a = !foo) in the cell.

                     A line qualifies when it has a top-level ``=``, its source text does
                     not itself begin with ``=``, and the ``=`` is followed by error
                     tokens that are all whitespace up to a ``!``. Returns an instance
                     positioned at that ``!``, or None.
                     """
                     for line in tokens_by_line:
                         assign_ix = _find_assign_op(line)
                         if assign_ix is None:
                             continue
                         if line[assign_ix].line.strip().startswith('='):
                             continue
                         if len(line) < assign_ix + 2:
                             continue
                         # Walk the error tokens after '='; only whitespace may
                         # come before the '!'.
                         for tok in line[assign_ix + 1:]:
                             if tok.type != tokenize.ERRORTOKEN:
                                 break
                             if tok.string == '!':
                                 return cls(tok.start)
                             if not tok.string.isspace():
                                 break
                     return None

                 def transform(self, lines: List[str]):
                     """Transform a system assignment found by the ``find()`` classmethod.

                     The text before the ``!`` is kept; the command (including any
                     backslash-continued lines) becomes a single-line
                     ``get_ipython().getoutput(cmd)`` call.
                     """
                     row, col = self.start_line, self.start_col
                     last_row = find_end_of_continued_line(lines, row)
                     rhs = assemble_continued_line(lines, (row, col), last_row)
                     assert rhs.startswith('!'), rhs
                     prefix = lines[row][:col]
                     call = "get_ipython().getoutput({!r})".format(rhs[1:])
                     replaced = [prefix + call + '\n']
                     return lines[:row] + replaced + lines[last_row + 1:]
             # The escape sequences that define the syntax transformations IPython will
             # apply to user input.  These can NOT be just changed here: many regular
             # expressions and other parts of the code may use their hardcoded values, and
             # for all intents and purposes they constitute the 'IPython syntax', so they
             # should be considered fixed.
             ESC_SHELL  = '!'     # Send line to underlying system shell
             ESC_SH_CAP = '!!'    # Send line to system shell and capture output
             ESC_HELP   = '?'     # Find information about object
             ESC_HELP2  = '??'    # Find extra-detailed information about object
             ESC_MAGIC  = '%'     # Call magic function
             ESC_MAGIC2 = '%%'    # Call cell-magic function
             ESC_QUOTE  = ','     # Split args on whitespace, quote each as string and call
             ESC_QUOTE2 = ';'     # Quote all args as a single string, call
             ESC_PAREN  = '/'     # Call first argument with rest of line as arguments
             # Single-character escapes; EscapedCommand.find compares the first
             # significant token of a line against this set.
             ESCAPE_SINGLES = {'!', '?', '%', ',', ';', '/'}
             # Two-character escapes; EscapedCommand.transform checks these before
             # falling back to a one-character escape.
             ESCAPE_DOUBLES = {'!!', '??'}  # %% (cell magic) is handled separately
             def _make_help_call(target, esc, next_input=None):
                 """Build the source of a pinfo/pinfo2/psearch call for *target*.

                 The magic used is ``pinfo2`` when *esc* is ``??``, otherwise
                 ``psearch`` when *target* contains ``*``, otherwise ``pinfo``. When
                 *next_input* is given, a ``set_next_input`` call is placed in front of
                 the help call on the same line.
                 """
                 if esc == '??':
                     method = 'pinfo2'
                 elif '*' in target:
                     method = 'psearch'
                 else:
                     method = 'pinfo'
                 # Build "<method> <target>" and split it again into the pair of
                 # arguments expected by get_ipython().run_line_magic(name, args).
                 arg = " ".join([method, target])
                 t_magic_name, _, t_magic_arg_s = arg.partition(' ')
                 t_magic_name = t_magic_name.lstrip(ESC_MAGIC)
                 help_args = (t_magic_name, t_magic_arg_s)
                 if next_input is not None:
                     return 'get_ipython().set_next_input(%r);get_ipython().run_line_magic(%r, %r)' % \
                         ((next_input,) + help_args)
                 return 'get_ipython().run_line_magic(%r, %r)' % help_args
             def _tr_help(content):
                 """Translate lines escaped with: ?
                 A naked help line should fire the intro help screen (shell.show_usage())
                 """
                 if not content:
                     return 'get_ipython().show_usage()'
                 return _make_help_call(content, '?')
             def _tr_help2(content):
                 """Translate lines escaped with: ??
                 A naked help line should fire the intro help screen (shell.show_usage())
                 """
                 if not content:
                     return 'get_ipython().show_usage()'
                 return _make_help_call(content, '??')
             def _tr_magic(content):
                 "Translate lines escaped with a percent sign: %"
                 name, _, args = content.partition(' ')
                 return 'get_ipython().run_line_magic(%r, %r)' % (name, args)
             def _tr_quote(content):
                 "Translate lines escaped with a comma: ,"
                 name, _, args = content.partition(' ')
                 return '%s("%s")' % (name, '", "'.join(args.split()) )
             def _tr_quote2(content):
                 "Translate lines escaped with a semicolon: ;"
                 name, _, args = content.partition(' ')
                 return '%s("%s")' % (name, args)
             def _tr_paren(content):
                 "Translate lines escaped with a slash: /"
                 name, _, args = content.partition(' ')
                 return '%s(%s)' % (name, ", ".join(args.split()))
             # Dispatch table: escape sequence -> callable that takes the text after
             # the escape and returns the replacement Python source. Used by
             # EscapedCommand.transform. ESC_MAGIC2 (%%) has no entry here.
             tr = { ESC_SHELL  : 'get_ipython().system({!r})'.format,
                    ESC_SH_CAP : 'get_ipython().getoutput({!r})'.format,
                    ESC_HELP   : _tr_help,
                    ESC_HELP2  : _tr_help2,
                    ESC_MAGIC  : _tr_magic,
                    ESC_QUOTE  : _tr_quote,
                    ESC_QUOTE2 : _tr_quote2,
                    ESC_PAREN  : _tr_paren }
             class EscapedCommand(TokenTransformBase):
                 """Transformer for escaped commands like %foo, !foo, or /foo"""

                 @classmethod
                 def find(cls, tokens_by_line):
                     """Find the first escaped command (%foo, !foo, etc.) in the cell.

                     Looks at the first token of each logical line that is not an
                     INDENT or DEDENT; if its text is one of ESCAPE_SINGLES, an instance
                     positioned at that token is returned. Returns None otherwise.
                     """
                     layout = (tokenize.INDENT, tokenize.DEDENT)
                     for line in tokens_by_line:
                         first = next((tok for tok in line if tok.type not in layout), None)
                         if first is not None and first.string in ESCAPE_SINGLES:
                             return cls(first.start)
                     return None

                 def transform(self, lines):
                     """Transform an escaped line found by the ``find()`` classmethod.

                     The command (with any backslash-continued lines) is replaced by one
                     line holding the original indentation plus the translated call. An
                     escape with no entry in ``tr`` yields an empty call.
                     """
                     row, col = self.start_line, self.start_col
                     indent = lines[row][:col]
                     last_row = find_end_of_continued_line(lines, row)
                     text = assemble_continued_line(lines, (row, col), last_row)

                     # Prefer a two-character escape (!!, ??) over a single one.
                     width = 2 if (len(text) > 1 and text[:2] in ESCAPE_DOUBLES) else 1
                     escape, content = text[:width], text[width:]

                     handler = tr.get(escape)
                     call = handler(content) if handler is not None else ''

                     return lines[:row] + [indent + call + '\n'] + lines[last_row + 1:]
             # Matches a help request at the end of the text: group 1 is the target
             # (optionally prefixed by up to two '%', dotted, may contain '*'),
             # group 3 is the trailing '?' or '??'.
             _help_end_re = re.compile(r"""(%{0,2}
                                           (?!\d)[\w*]+            # Variable name
                                           (\.(?!\d)[\w*]+)*       # .etc.etc
                                           )
                                           (\?\??)$                # ? or ??
                                           """,
                                           re.VERBOSE)
             class HelpEnd(TokenTransformBase):
                 """Transformer for help syntax: obj? and obj??"""
                 # Must win over EscapedCommand (lower number = higher priority) so that
                 # inspecting magics (%foo?) works.
                 priority = 5

                 def __init__(self, start, q_locn):
                     """Store the start of the line and the location of the ``?``.

                     *q_locn* is indexed as ``(line, column)``; like *start*, its line
                     is converted from 1-indexed to 0-indexed.
                     """
                     super().__init__(start)
                     q_line, q_col = q_locn[0], q_locn[1]
                     self.q_line = q_line - 1
                     self.q_col = q_col

                 @classmethod
                 def find(cls, tokens_by_line):
                     """Find the first help command (foo?) in the cell.

                     A logical line matches when it has more than two tokens and the
                     token before the last one is ``?`` (the last one is expected to be
                     the NEWLINE). Returns None when no line matches.
                     """
                     layout = (tokenize.INDENT, tokenize.DEDENT)
                     for line in tokens_by_line:
                         if len(line) <= 2:
                             continue
                         question = line[-2]
                         if question.string != '?':
                             continue
                         # Start from the first token that is not INDENT/DEDENT.
                         first = next(tok for tok in line if tok.type not in layout)
                         return cls(first.start, question.start)
                     return None

                 def transform(self, lines):
                     """Transform a help command found by the ``find()`` classmethod.

                     Raises SyntaxError (carrying the offending text) when the text up
                     to the ``?`` does not end in a recognisable help target.
                     """
                     first, last = self.start_line, self.q_line
                     lines_before = lines[:first]
                     lines_after = lines[last + 1:]

                     piece = ''.join(lines[first:last + 1])
                     indent = piece[:self.start_col]
                     content = piece[self.start_col:]

                     m = _help_end_re.search(content)
                     if m is None:
                         raise SyntaxError(content)
                     target, esc = m.group(1), m.group(3)

                     # If we're mid-command, put it back on the next prompt for the user.
                     standalone = (not lines_before) and (not lines_after)
                     if standalone and content.strip() != m.group(0):
                         next_input = content.rstrip('?\n')
                     else:
                         next_input = None

                     call = _make_help_call(target, esc, next_input=next_input)
                     return lines_before + [indent + call + '\n'] + lines_after
             def make_tokens_by_line(lines:List[str]):
                 """Tokenize a series of lines and group the tokens by logical line.

                 Tokens belonging to a multiline Python string or bracketed expression
                 end up in the same group. Every line except possibly the last should
                 keep its line ending for this to work properly; for example, split a
                 block of text with ``str.splitlines(keepends=True)`` before passing it
                 in. A warning is issued when several lines are given and the first one
                 has no line ending.

                 If tokenizing stops with ``tokenize.TokenError`` (input ending inside a
                 multiline string or expression), the tokens produced so far are kept.
                 """
                 # NL tokens are used inside multiline expressions, but also after blank
                 # lines or comments. This is intentional - see https://bugs.python.org/issue17061
                 # We want to group the former case together but split the latter, so we
                 # track the bracket depth, similar to the internals of tokenize.
                 #   reexported from token on 3.7+
                 NEWLINE, NL = tokenize.NEWLINE, tokenize.NL  # type: ignore
                 openers = ('(', '[', '{')
                 closers = (')', ']', '}')

                 if len(lines) > 1 and not lines[0].endswith(('\n', '\r', '\r\n', '\x0b', '\x0c')):
                     warnings.warn("`make_tokens_by_line` received a list of lines which do not have lineending markers ('\\n', '\\r', '\\r\\n', '\\x0b', '\\x0c'), behavior will be unspecified")

                 grouped:List[List[Any]] = []
                 current:List[Any] = []
                 depth = 0
                 try:
                     for tok in tokenize.generate_tokens(iter(lines).__next__):
                         current.append(tok)
                         kind = tok.type
                         if kind == NEWLINE or (kind == NL and depth <= 0):
                             # End of a logical line: start collecting the next one.
                             grouped.append(current)
                             current = []
                         elif tok.string in openers:
                             depth += 1
                         elif tok.string in closers and depth > 0:
                             depth -= 1
                 except tokenize.TokenError:
                     # Input ended in a multiline string or expression. That's OK for us.
                     pass

                 if current:
                     grouped.append(current)
                 return grouped
             def has_sunken_brackets(tokens: List[tokenize.TokenInfo]):
                 """Tell whether a closing bracket appears with no open bracket to match.

                 Returns True as soon as the bracket depth would drop below zero while
                 scanning *tokens* in order, and False if that never happens.
                 """
                 openers = ("(", "[", "{")
                 closers = (")", "]", "}")
                 depth = 0
                 for tok in tokens:
                     text = tok.string
                     if text in openers:
                         depth += 1
                     elif text in closers:
                         if depth == 0:
                             return True
                         depth -= 1
                 return False
             def show_linewise_tokens(s: str):
                 """Print the tokens of *s* grouped by logical line (debugging aid).

                 A trailing newline is added to *s* if it is missing before the text is
                 split into lines and tokenized.
                 """
                 source = s if s.endswith('\n') else s + '\n'
                 for token_line in make_tokens_by_line(source.splitlines(keepends=True)):
                     print("Line -------")
                     for tok in token_line:
                         print(" ", tok)
             # Arbitrary limit to prevent getting stuck in infinite loops:
             # TransformerManager.do_token_transforms raises RuntimeError once this
             # many successive token transformations have each changed the input.
             TRANSFORM_LOOP_LIMIT = 500
             class TransformerManager:
                 """Applies various transformations to a cell or code block.
                 The key methods for external use are ``transform_cell()``
                 and ``check_complete()``.
                 """
                 def __init__(self):
                     """Set up the default transformation pipeline.

                     The three lists are plain attributes, applied by
                     ``transform_cell()`` in this order: cleanup transforms, then line
                     transforms, then token transformers.
                     """
                     # Callables taking and returning a list of lines; applied first.
                     self.cleanup_transforms = [
                         leading_empty_lines,
                         leading_indent,
                         classic_prompt,
                         ipython_prompt,
                     ]
                     # Callables taking and returning a list of lines; applied after
                     # the cleanup transforms.
                     self.line_transforms = [
                         cell_magic,
                     ]
                     # Transformer classes; each is asked to ``find`` a match in the
                     # tokenized input (see do_one_token_transform).
                     self.token_transformers = [
                         MagicAssign,
                         SystemAssign,
                         EscapedCommand,
                         HelpEnd,
                     ]
                 def do_one_token_transform(self, lines):
                     """Apply the token transformation that matches earliest in the code.

                     Returns ``(changed, lines)``. Callers repeat the call until
                     *changed* is False, meaning no transformation applies any more.

                     The tokens after a piece of IPython special syntax may not be
                     valid, so the code is tokenized afresh on every call to locate the
                     next piece. Long cells are expected to be mostly plain Python with
                     little special syntax, so this should not be a performance issue.

                     Candidates are tried in ``sortby()`` order; one that raises
                     SyntaxError from ``transform`` is skipped in favour of the next.
                     """
                     tokens_by_line = make_tokens_by_line(lines)
                     matches = (cls.find(tokens_by_line) for cls in self.token_transformers)
                     candidates = [found for found in matches if found]
                     if not candidates:
                         # Nothing to transform
                         return False, lines

                     for candidate in sorted(candidates, key=TokenTransformBase.sortby):
                         try:
                             transformed = candidate.transform(lines)
                         except SyntaxError:
                             continue
                         return True, transformed
                     return False, lines
                 def do_token_transforms(self, lines):
                     """Run token transformations until the input stops changing.

                     Raises RuntimeError if the input is still changing after
                     TRANSFORM_LOOP_LIMIT rounds.
                     """
                     rounds_left = TRANSFORM_LOOP_LIMIT
                     while rounds_left > 0:
                         changed, lines = self.do_one_token_transform(lines)
                         if not changed:
                             return lines
                         rounds_left -= 1

                     raise RuntimeError("Input transformation still changing after "
                                        "%d iterations. Aborting." % TRANSFORM_LOOP_LIMIT)
                 def transform_cell(self, cell: str) -> str:
                     """Transform a cell of input code and return the resulting source.

                     The cell is given a trailing newline if it lacks one, split into
                     lines, passed through the cleanup and line transforms in order,
                     then through the token transforms, and finally joined back.
                     """
                     # Ensure the cell has a trailing newline
                     source = cell if cell.endswith('\n') else cell + '\n'
                     lines = source.splitlines(keepends=True)

                     pipeline = self.cleanup_transforms + self.line_transforms
                     for step in pipeline:
                         lines = step(lines)

                     return ''.join(self.do_token_transforms(lines))
                 def check_complete(self, cell: str):
                     """Return whether a block of code is ready to execute, or should be continued

                     Parameters
                     ----------
                     cell : str
                       Python input code, which can be multiline.

                     Returns
                     -------
                     status : str
                       One of 'complete', 'incomplete', or 'invalid' if the input is not a
                       prefix of valid code.
                     indent_spaces : int or None
                       The number of spaces by which to indent the next line of code.
                       This is None whenever status is not 'incomplete'; it is also None
                       for the 'incomplete' result reported when the last token line ends
                       with a backslash.
                     """
                     # Remember if the input ends in a new line. Walk backwards over the
                     # trailing whitespace: a '\n' seen before any non-whitespace
                     # character means the input already ends with a newline.
                     ends_with_newline = False
                     for character in reversed(cell):
                         if character == '\n':
                             ends_with_newline = True
                             break
                         elif character.strip():
                             # First non-whitespace character: no trailing newline.
                             break
                         else:
                             # Other whitespace: keep scanning backwards.
                             continue
                     if not ends_with_newline:
                         # Append a newline for consistent tokenization
                         # See https://bugs.python.org/issue33899
                         cell += '\n'
                     lines = cell.splitlines(keepends=True)
                     if not lines:
                         # Nothing to analyse.
                         return 'complete', None
                     if lines[-1].endswith('\\'):
                         # Explicit backslash continuation
                         return 'incomplete', find_last_indent(lines)
                     # Apply the cleanup transforms, skipping any that declare
                     # `has_side_effects`. A SyntaxError raised by a transform marks the
                     # input as invalid.
                     try:
                         for transform in self.cleanup_transforms:
                             if not getattr(transform, 'has_side_effects', False):
                                 lines = transform(lines)
                     except SyntaxError:
                         return 'invalid', None
                     if lines[0].startswith('%%'):
                         # Special case for cell magics - completion marked by blank line
                         # (the last line is empty or whitespace-only).
                         if lines[-1].strip():
                             return 'incomplete', find_last_indent(lines)
                         else:
                             return 'complete', None
                     # Same policy for the line transforms, followed by the token
                     # transforms: side-effect transforms are skipped and a SyntaxError
                     # means the input is invalid.
                     try:
                         for transform in self.line_transforms:
                             if not getattr(transform, 'has_side_effects', False):
                                 lines = transform(lines)
                         lines = self.do_token_transforms(lines)
                     except SyntaxError:
                         return 'invalid', None
                     tokens_by_line = make_tokens_by_line(lines)
                     # Bail if we got one line and there are more closing parentheses than
                     # the opening ones
                     if (
                         len(lines) == 1
                         and tokens_by_line
                         and has_sunken_brackets(tokens_by_line[0])
                     ):
                         return "invalid", None
                     if not tokens_by_line:
                         # No token lines were produced: ask for more input.
                         return 'incomplete', find_last_indent(lines)
                     if tokens_by_line[-1][-1].type != tokenize.ENDMARKER:
                         # We're in a multiline string or expression
                         return 'incomplete', find_last_indent(lines)
                     # Token types that are stripped from the end of the last line below.
                     newline_types = {tokenize.NEWLINE, tokenize.COMMENT, tokenize.ENDMARKER} # type: ignore
                     # Pop the last line which only contains DEDENTs and ENDMARKER, and
                     # keep it: it is consulted again after the compile check below.
                     last_token_line = None
                     if {t.type for t in tokens_by_line[-1]} in [
                         {tokenize.DEDENT, tokenize.ENDMARKER},
                         {tokenize.ENDMARKER}
                     ] and len(tokens_by_line) > 1:
                         last_token_line = tokens_by_line.pop()
                     # Strip trailing NEWLINE/COMMENT/ENDMARKER tokens from the last
                     # remaining token line.
                     while tokens_by_line[-1] and tokens_by_line[-1][-1].type in newline_types:
                         tokens_by_line[-1].pop()
                     if not tokens_by_line[-1]:
                         # The last line held nothing but newline/comment/end tokens.
                         return 'incomplete', find_last_indent(lines)
                     if tokens_by_line[-1][-1].string == ':':
                         # The last line starts a block (e.g. 'if foo:')
                         # Skip leading INDENT/DEDENT tokens; the start column of the
                         # first remaining token is the line's indentation, and the next
                         # line is indented 4 columns further.
                         ix = 0
                         while tokens_by_line[-1][ix].type in {tokenize.INDENT, tokenize.DEDENT}:
                             ix += 1
                         indent = tokens_by_line[-1][ix].start[1]
                         return 'incomplete', indent + 4
                     # The source line of the first token on the last token line ends with
                     # a backslash: incomplete, with no indentation suggestion.
                     if tokens_by_line[-1][0].line.endswith('\\'):
                         return 'incomplete', None
                     # At this point, our checks think the code is complete (or invalid).
                     # We'll use codeop.compile_command to check this with the real parser
                     try:
                         with warnings.catch_warnings():
                             # Promote SyntaxWarning to an exception so that it is caught
                             # below and reported as 'invalid'.
                             warnings.simplefilter('error', SyntaxWarning)
                             res = compile_command(''.join(lines), symbol='exec')
                     except (SyntaxError, OverflowError, ValueError, TypeError,
                             MemoryError, SyntaxWarning):
                         return 'invalid', None
                     else:
                         if res is None:
                             # compile_command produced no code object: more input needed.
                             return 'incomplete', find_last_indent(lines)
                     # The token line popped earlier started with a DEDENT: the input is
                     # only complete if it ended with a newline.
                     if last_token_line and last_token_line[0].type == tokenize.DEDENT:
                         if ends_with_newline:
                             return 'complete', None
                         return 'incomplete', find_last_indent(lines)
                     # If there's a blank line at the end, assume we're ready to execute
                     # NOTE: both this branch and the fall-through return the same result.
                     if not lines[-1].strip():
                         return 'complete', None
                     return 'complete', None
             def find_last_indent(lines):
                 """Return the indentation width of the last line in *lines*.

                 Only leading spaces and tabs are counted; each space is one column
                 and each tab is four.

                 Parameters
                 ----------
                 lines : list of str
                     Lines of source code.

                 Returns
                 -------
                 int
                     The indentation width of ``lines[-1]``, or 0 when that line is
                     not indented or *lines* is empty.
                 """
                 if not lines:
                     # Nothing to measure; avoids an IndexError on lines[-1].
                     return 0
                 last_line = lines[-1]
                 # Leading run of spaces/tabs, i.e. what the pattern ^[ \t]+ matches.
                 indent_len = len(last_line) - len(last_line.lstrip(' \t'))
                 leading = last_line[:indent_len]
                 return len(leading.replace('\t', ' ' * 4))