upstream/ipython Commit - r23333:ccf44ed3

1

"""Input handling and transformation machinery.

1

"""Input handling and transformation machinery.

2

3

The first class in this module, :class:`InputSplitter`, is designed to tell when

3

The first class in this module, :class:`InputSplitter`, is designed to tell when

4

input from a line-oriented frontend is complete and should be executed, and when

4

input from a line-oriented frontend is complete and should be executed, and when

5

the user should be prompted for another line of code instead. The name 'input

5

the user should be prompted for another line of code instead. The name 'input

6

splitter' is largely for historical reasons.

6

splitter' is largely for historical reasons.

7

8

A companion, :class:`IPythonInputSplitter`, provides the same functionality but

8

A companion, :class:`IPythonInputSplitter`, provides the same functionality but

9

with full support for the extended IPython syntax (magics, system calls, etc).

9

with full support for the extended IPython syntax (magics, system calls, etc).

10

The code to actually do these transformations is in :mod:`IPython.core.inputtransformer`.

10

The code to actually do these transformations is in :mod:`IPython.core.inputtransformer`.

11

:class:`IPythonInputSplitter` feeds the raw code to the transformers in order

11

:class:`IPythonInputSplitter` feeds the raw code to the transformers in order

12

and stores the results.

12

and stores the results.

13

14

For more details, see the class docstrings below.

14

For more details, see the class docstrings below.

15

"""

15

"""

16

17

# Copyright (c) IPython Development Team.

17

# Copyright (c) IPython Development Team.

18

# Distributed under the terms of the Modified BSD License.

18

# Distributed under the terms of the Modified BSD License.

19

import ast

19

import ast

20

import codeop

20

import codeop

21

import io

21

import io

22

import re

22

import re

23

import sys

23

import sys

24

import tokenize

24

import tokenize

25

import warnings

25

import warnings

26

27

from IPython.utils.py3compat import cast_unicode

27

from IPython.utils.py3compat import cast_unicode

28

from IPython.core.inputtransformer import (leading_indent,

28

from IPython.core.inputtransformer import (leading_indent,

29

classic_prompt,

29

classic_prompt,

30

ipy_prompt,

30

ipy_prompt,

31

cellmagic,

31

cellmagic,

32

assemble_logical_lines,

32

assemble_logical_lines,

33

help_end,

33

help_end,

34

escaped_commands,

34

escaped_commands,

35

assign_from_magic,

35

assign_from_magic,

36

assign_from_system,

36

assign_from_system,

37

assemble_python_lines,

37

assemble_python_lines,

38

)

38

)

39

40

# These are available in this module for backwards compatibility.

40

# These are available in this module for backwards compatibility.

41

from IPython.core.inputtransformer import (ESC_SHELL, ESC_SH_CAP, ESC_HELP,

41

from IPython.core.inputtransformer import (ESC_SHELL, ESC_SH_CAP, ESC_HELP,

42

ESC_HELP2, ESC_MAGIC, ESC_MAGIC2,

42

ESC_HELP2, ESC_MAGIC, ESC_MAGIC2,

43

ESC_QUOTE, ESC_QUOTE2, ESC_PAREN, ESC_SEQUENCES)

43

ESC_QUOTE, ESC_QUOTE2, ESC_PAREN, ESC_SEQUENCES)

44

45

#-----------------------------------------------------------------------------

45

#-----------------------------------------------------------------------------

46

# Utilities

46

# Utilities

47

#-----------------------------------------------------------------------------

47

#-----------------------------------------------------------------------------

48

49

# FIXME: These are general-purpose utilities that later can be moved to the

49

# FIXME: These are general-purpose utilities that later can be moved to the

50

# general ward. Kept here for now because we're being very strict about test

50

# general ward. Kept here for now because we're being very strict about test

51

# coverage with this code, and this lets us ensure that we keep 100% coverage

51

# coverage with this code, and this lets us ensure that we keep 100% coverage

52

# while developing.

52

# while developing.

53

54

# Compiled regexps for autoindent management.

# Matches an indented line holding a statement that normally ends a block
# (raise, return, pass, break, continue).
dedent_re = re.compile('|'.join([
    r'^\s+raise(\s.*)?$',  # raise statement (+ space + other stuff, maybe)
    r'^\s+raise\([^\)]*\).*$',  # wacky raise with immediate open paren
    r'^\s+return(\s.*)?$',  # normal return (+ space + other stuff, maybe)
    r'^\s+return\([^\)]*\).*$',  # wacky return with immediate open paren
    r'^\s+pass\s*$',  # pass (optionally followed by trailing spaces)
    r'^\s+break\s*$',  # break (optionally followed by trailing spaces)
    r'^\s+continue\s*$',  # continue (optionally followed by trailing spaces)
]))

# Leading run of blanks (newline deliberately excluded from the class).
ini_spaces_re = re.compile(r'^([ \t\r\f\v]+)')

# regexp to match pure comment lines so we don't accidentally insert 'if 1:'
# before pure comments
comment_line_re = re.compile(r'^\s*\#')

69

70

71

def num_ini_spaces(s):
    """Return the number of initial spaces in a string.

    Note that tabs are counted as a single space.  For now, we do *not* support
    mixing of tabs and spaces in the user's input.

    Parameters
    ----------
    s : string

    Returns
    -------
    n : int
        Length of the leading run of space, tab, carriage-return, form-feed
        and vertical-tab characters; 0 when the string does not start with
        one of them.  A newline is not counted as a blank.
    """
    # Same character class as the module's ``ini_spaces_re`` pattern
    # (``^([ \t\r\f\v]+)``): measure how much a left-strip removes.
    return len(s) - len(s.lstrip(' \t\r\f\v'))

91

92

# Fake token types for partial_tokenize:
INCOMPLETE_STRING = tokenize.N_TOKENS
IN_MULTILINE_STATEMENT = tokenize.N_TOKENS + 1


# The 2 classes below have the same API as TokenInfo, but don't try to look up
# a token type name that they won't find.
class IncompleteString:
    """Pseudo-token marking code that ends inside an unterminated string.

    Parameters
    ----------
    s : string
        Text of the unfinished string.
    start, end : tuple
        Positions stored as-is on the instance.
    line : string
        Source line stored as-is on the instance.
    """
    type = exact_type = INCOMPLETE_STRING

    def __init__(self, s, start, end, line):
        self.s = s
        self.start = start
        self.end = end
        self.line = line


class InMultilineStatement:
    """Pseudo-token marking code that ends inside a multi-line statement.

    Parameters
    ----------
    pos : tuple
        Position used for both ``start`` and ``end``.
    line : string
        Source line stored as-is on the instance.
    """
    type = exact_type = IN_MULTILINE_STATEMENT

    def __init__(self, pos, line):
        # This marker carries no text of its own.
        self.s = ''
        self.start = self.end = pos
        self.line = line

112

113

def partial_tokens(s):
    """Iterate over tokens from a possibly-incomplete string of code.

    This adds two special token types: INCOMPLETE_STRING and
    IN_MULTILINE_STATEMENT. These can only occur as the last token yielded, and
    represent the two main ways for code to be incomplete.

    Parameters
    ----------
    s : string
        Source code, possibly ending in the middle of a string or statement.

    Yields
    ------
    Regular ``tokenize`` tokens, optionally followed by one
    :class:`IncompleteString` or :class:`InMultilineStatement` marker.

    Raises
    ------
    tokenize.TokenError
        Re-raised when the tokenizer error message mentions neither a
        multi-line string nor a multi-line statement.
    """
    readline = io.StringIO(s).readline
    # Placeholder so ``token.end`` is defined even if the very first token
    # fails to tokenize.
    token = tokenize.TokenInfo(tokenize.NEWLINE, '', (1, 0), (1, 0), '')
    try:
        for token in tokenize.generate_tokens(readline):
            yield token
    except tokenize.TokenError as e:
        # catch EOF error
        message = e.args[0]
        lines = s.splitlines(keepends=True)
        # (row, column) just past the last character of the input.
        end = len(lines), len(lines[-1])
        if 'multi-line string' in message:
            # Everything after the last good token belongs to the string.
            row, col = start = token.end
            remainder = lines[row - 1][col:] + ''.join(lines[row:])
            yield IncompleteString(remainder, start, end, lines[-1])
        elif 'multi-line statement' in message:
            yield InMultilineStatement(end, lines[-1])
        else:
            raise

137

138

def find_next_indent(code):
    """Find the number of spaces for the next line of indentation

    Parameters
    ----------
    code : string
        The code entered so far; it may be incomplete.

    Returns
    -------
    n : int
        Suggested indentation, in spaces, for the line that follows ``code``.
    """
    tokens = list(partial_tokens(code))
    if tokens[-1].type == tokenize.ENDMARKER:
        tokens.pop()
    if not tokens:
        return 0
    if tokens[-1].type in {tokenize.DEDENT, tokenize.NEWLINE, tokenize.COMMENT}:
        tokens.pop()
    if not tokens:
        # Nothing left to inspect after dropping the trailing token.
        return 0

    if tokens[-1].type == INCOMPLETE_STRING:
        # Inside a multiline string
        return 0

    # Find the indents used before
    prev_indents = [0]
    def _add_indent(n):
        if n != prev_indents[-1]:
            prev_indents.append(n)

    tokiter = iter(tokens)
    for tok in tokiter:
        if tok.type in {tokenize.INDENT, tokenize.DEDENT}:
            _add_indent(tok.end[1])
        elif (tok.type == tokenize.NL):
            # After a non-logical newline, the column of the following token
            # is recorded as an indentation level (that token is consumed).
            try:
                _add_indent(next(tokiter).start[1])
            except StopIteration:
                break

    last_indent = prev_indents.pop()

    # If we've just opened a multiline statement (e.g. 'a = ['), indent more
    if tokens[-1].type == IN_MULTILINE_STATEMENT:
        # The marker can be the only token (e.g. code that is just a
        # backslash continuation), so make sure a previous token exists.
        if len(tokens) >= 2 and tokens[-2].exact_type in {
                tokenize.LPAR, tokenize.LSQB, tokenize.LBRACE}:
            return last_indent + 4
        return last_indent

    if tokens[-1].exact_type == tokenize.COLON:
        # Line ends with colon - indent
        return last_indent + 4

    if last_indent:
        # Examine the last line for dedent cues - statements like return or
        # raise which normally end a block of code.
        last_line_starts = 0
        for i, tok in enumerate(tokens):
            if tok.type == tokenize.NEWLINE:
                last_line_starts = i + 1

        last_line_tokens = tokens[last_line_starts:]
        names = [t.string for t in last_line_tokens if t.type == tokenize.NAME]
        if names and names[0] in {'raise', 'return', 'pass', 'break', 'continue'}:
            # Find the most recent indentation less than the current level
            for indent in reversed(prev_indents):
                if indent < last_indent:
                    return indent

    return last_indent

196

197

198

def last_blank(src):
    """Determine if the input source ends in a blank.

    A blank is either a newline or a line consisting of whitespace.

    Parameters
    ----------
    src : string
        A single or multiline string.

    Returns
    -------
    bool
        True when the last line produced by ``src.splitlines()`` is empty or
        whitespace-only; False for empty input.
    """
    if not src:
        return False
    ll = src.splitlines()[-1]
    return (ll == '') or ll.isspace()

211

212

213

last_two_blanks_re = re.compile(r'\n\s*\n\s*$', re.MULTILINE)
last_two_blanks_re2 = re.compile(r'.+\n\s*\n\s+$', re.MULTILINE)

def last_two_blanks(src):
    """Determine if the input source ends in two blanks.

    A blank is either a newline or a line consisting of whitespace.

    Parameters
    ----------
    src : string
        A single or multiline string.

    Returns
    -------
    bool
        True when the source ends in two blanks; False for empty input.
    """
    if not src:
        return False
    # The logic here is tricky: I couldn't get a regexp to work and pass all
    # the tests, so I took a different approach: split the source by lines,
    # grab the last two and prepend '###\n' as a stand-in for whatever was in
    # the body before the last two lines.  Then, with that structure, it's
    # possible to analyze with two regexps.  Not the most elegant solution, but
    # it works.  If anyone tries to change this logic, make sure to validate
    # the whole test suite first!
    new_src = '\n'.join(['###\n'] + src.splitlines()[-2:])
    # NOTE: ``match`` anchors at the start of ``new_src``, which always begins
    # with '###', so the first pattern (which must start on a newline) cannot
    # succeed here; it is kept so behavior stays exactly as before.
    return (bool(last_two_blanks_re.match(new_src)) or
            bool(last_two_blanks_re2.match(new_src)))

237

238

239

def remove_comments(src):
    """Remove all comments from input source.

    Note: comments are NOT recognized inside of strings!  Everything from a
    ``#`` to the end of its line is removed, even when the ``#`` sits inside
    a string literal.

    Parameters
    ----------
    src : string
        A single or multiline input string.

    Returns
    -------
    String with all Python comments removed.
    """
    return re.sub('#.*', '', src)

255

256

257

def get_input_encoding():
    """Return the default standard input encoding.

    If sys.stdin has no encoding, 'ascii' is returned."""
    # There are strange environments for which sys.stdin.encoding is None. We
    # ensure that a valid encoding is returned.
    encoding = getattr(sys.stdin, 'encoding', None)
    if encoding is None:
        encoding = 'ascii'
    return encoding

267

268

#-----------------------------------------------------------------------------

269

#-----------------------------------------------------------------------------

269

# Classes and functions for normal Python syntax handling

270

# Classes and functions for normal Python syntax handling

270

#-----------------------------------------------------------------------------

271

#-----------------------------------------------------------------------------

271

272

class InputSplitter(object):

273

class InputSplitter(object):

273

r"""An object that can accumulate lines of Python source before execution.

274

r"""An object that can accumulate lines of Python source before execution.

274

275

This object is designed to be fed python source line-by-line, using

276

This object is designed to be fed python source line-by-line, using

276

:meth:`push`. It will return on each push whether the currently pushed

277

:meth:`push`. It will return on each push whether the currently pushed

277

code could be executed already. In addition, it provides a method called

278

code could be executed already. In addition, it provides a method called

278

:meth:`push_accepts_more` that can be used to query whether more input

279

:meth:`push_accepts_more` that can be used to query whether more input

279

can be pushed into a single interactive block.

280

can be pushed into a single interactive block.

280

281

This is a simple example of how an interactive terminal-based client can use

282

This is a simple example of how an interactive terminal-based client can use

282

this tool::

283

this tool::

283

284

isp = InputSplitter()

285

isp = InputSplitter()

285

while isp.push_accepts_more():

286

while isp.push_accepts_more():

286

indent = ' '*isp.indent_spaces

287

indent = ' '*isp.indent_spaces

287

prompt = '>>> ' + indent

288

prompt = '>>> ' + indent

288

line = indent + raw_input(prompt)

289

line = indent + raw_input(prompt)

289

isp.push(line)

290

isp.push(line)

290

print 'Input source was:\n', isp.source_reset(),

291

print 'Input source was:\n', isp.source_reset(),

291

"""

292

"""

292

# Number of spaces of indentation computed from input that has been pushed

293

# Number of spaces of indentation computed from input that has been pushed

293

# so far. This is the attributes callers should query to get the current

294

# so far. This is the attributes callers should query to get the current

294

# indentation level, in order to provide auto-indent facilities.

295

# indentation level, in order to provide auto-indent facilities.

295

indent_spaces = 0

296

indent_spaces = 0

296

# String, indicating the default input encoding. It is computed by default

297

# String, indicating the default input encoding. It is computed by default

297

# at initialization time via get_input_encoding(), but it can be reset by a

298

# at initialization time via get_input_encoding(), but it can be reset by a

298

# client with specific knowledge of the encoding.

299

# client with specific knowledge of the encoding.

299

encoding = ''

300

encoding = ''

300

# String where the current full source input is stored, properly encoded.

301

# String where the current full source input is stored, properly encoded.

301

# Reading this attribute is the normal way of querying the currently pushed

302

# Reading this attribute is the normal way of querying the currently pushed

302

# source code, that has been properly encoded.

303

# source code, that has been properly encoded.

303

source = ''

304

source = ''

304

# Code object corresponding to the current source. It is automatically

305

# Code object corresponding to the current source. It is automatically

305

# synced to the source, so it can be queried at any time to obtain the code

306

# synced to the source, so it can be queried at any time to obtain the code

306

# object; it will be None if the source doesn't compile to valid Python.

307

# object; it will be None if the source doesn't compile to valid Python.

307

code = None

308

code = None

308

309

# Private attributes

310

# Private attributes

310

311

# List with lines of input accumulated so far

312

# List with lines of input accumulated so far

312

_buffer = None

313

_buffer = None

313

# Command compiler

314

# Command compiler

314

_compile = None

315

_compile = None

315

# Mark when input has changed indentation all the way back to flush-left

316

# Mark when input has changed indentation all the way back to flush-left

316

_full_dedent = False

317

_full_dedent = False

317

# Boolean indicating whether the current block is complete

318

# Boolean indicating whether the current block is complete

318

_is_complete = None

319

_is_complete = None

319

# Boolean indicating whether the current block has an unrecoverable syntax error

320

# Boolean indicating whether the current block has an unrecoverable syntax error

320

_is_invalid = False

321

_is_invalid = False

321

322

def __init__(self):
    """Create a new InputSplitter instance.

    Sets up an empty line buffer, a ``codeop.CommandCompiler`` and the
    default input encoding from ``get_input_encoding()``.
    """
    self._buffer = []
    self._compile = codeop.CommandCompiler()
    self.encoding = get_input_encoding()

328

329

def reset(self):
    """Reset the input buffer and associated state."""
    self.indent_spaces = 0
    # Clear in place so the same list object stays bound to ``_buffer``.
    self._buffer[:] = []
    self.source = ''
    self.code = None
    self._is_complete = False
    self._is_invalid = False
    self._full_dedent = False

338

339

def source_reset(self):
    """Return the input source and perform a full reset.

    Returns
    -------
    out : string
        The value of ``self.source`` as it was before the reset.
    """
    out = self.source
    self.reset()
    return out

345

346

def check_complete(self, source):
    """Return whether a block of code is ready to execute, or should be continued

    This is a non-stateful API, and will reset the state of this InputSplitter.

    Parameters
    ----------
    source : string
        Python input code, which can be multiline.

    Returns
    -------
    status : str
        One of 'complete', 'incomplete', or 'invalid' if source is not a
        prefix of valid code.
    indent_spaces : int or None
        The number of spaces by which to indent the next line of code. If
        status is not 'incomplete', this is None.
    """
    self.reset()
    try:
        self.push(source)
    except SyntaxError:
        # Transformers in IPythonInputSplitter can raise SyntaxError,
        # which push() will not catch.
        return 'invalid', None
    else:
        if self._is_invalid:
            return 'invalid', None
        elif self.push_accepts_more():
            # The return value is built before the ``finally`` reset runs.
            return 'incomplete', self.indent_spaces
        else:
            return 'complete', None
    finally:
        self.reset()

381

382

def push(self, lines):
    """Push one or more lines of input.

    This stores the given lines and returns a status code indicating
    whether the code forms a complete Python block or not.

    Any exceptions generated in compilation are swallowed, but if an
    exception was produced, the method returns True.

    Parameters
    ----------
    lines : string
        One or more lines of Python input.

    Returns
    -------
    is_complete : boolean
        True if the current input source (the result of the current input
        plus prior inputs) forms a complete Python execution block.  Note that
        this value is also stored as a private attribute (``_is_complete``), so it
        can be queried at any time.
    """
    self._store(lines)
    source = self.source

    # Before calling _compile(), reset the code object to None so that if an
    # exception is raised in compilation, we don't mislead by having
    # inconsistent code/source attributes.
    self.code, self._is_complete = None, None
    self._is_invalid = False

    # Honor termination lines properly
    if source.endswith('\\\n'):
        return False

    self._update_indent()
    try:
        with warnings.catch_warnings():
            # Turn SyntaxWarning into an exception so it is caught below.
            warnings.simplefilter('error', SyntaxWarning)
            self.code = self._compile(source, symbol="exec")
    # Invalid syntax can produce any of a number of different errors from
    # inside the compiler, so we have to catch them all.  Syntax errors
    # immediately produce a 'ready' block, so the invalid Python can be
    # sent to the kernel for evaluation with possible ipython
    # special-syntax conversion.
    except (SyntaxError, OverflowError, ValueError, TypeError,
            MemoryError, SyntaxWarning):
        self._is_complete = True
        self._is_invalid = True
    else:
        # Compilation didn't produce any exceptions (though it may not have
        # given a complete code object)
        self._is_complete = self.code is not None

    return self._is_complete

437

438

def push_accepts_more(self):
    """Return whether a block of interactive input can accept more input.

    This method is meant to be used by line-oriented frontends, who need to
    guess whether a block is complete or not based solely on prior and
    current input lines.  The InputSplitter considers it has a complete
    interactive block and will not accept more input when either:

    * The code is complete and has a blank (empty or whitespace-only)
      line at the end.

    * The code is complete, flush left (``indent_spaces == 0``) and
      consists of a single line or a single non-compound statement.

    * The code is flagged complete, flush left, spans several lines and
      cannot be parsed by :func:`ast.parse`.

    No exception is raised for unparsable input: typically clients will
    want to send invalid syntax to an execution backend which might convert
    it into valid Python via one of the dynamic IPython mechanisms.

    Returns
    -------
    bool
        True if more input should be requested, False if the accumulated
        block should be executed.
    """
    # With incomplete input, unconditionally accept more.
    # A syntax error also sets _is_complete to True - see push()
    if not self._is_complete:
        return True

    # Split once; both the blank-line test and the single-line test below
    # need the list of source lines.
    source_lines = self.source.splitlines()

    # The user can make any (complete) input execute by leaving a blank line
    last_line = source_lines[-1]
    if (not last_line) or last_line.isspace():
        return False

    # If there's just a single line or AST node, and we're flush left, as is
    # the case after a simple statement such as 'a=1', we want to execute it
    # straight away.
    if self.indent_spaces == 0:
        if len(source_lines) <= 1:
            return False

        try:
            code_ast = ast.parse(u''.join(self._buffer))
        except Exception:
            # Unparsable input is handed on for execution rather than
            # prompting for more lines.
            return False
        else:
            # Compound statements (if/for/def/...) carry a ``body``
            # attribute; a lone node without one is a simple statement.
            if (len(code_ast.body) == 1
                    and not hasattr(code_ast.body[0], 'body')):
                return False

    # General fallback - accept more code
    return True

def _update_indent(self):
    """Recompute the indentation state from the accumulated source.

    Sets ``self.indent_spaces`` to the value returned by
    ``find_next_indent`` for the current source, and ``self._full_dedent``
    to whether that value is zero.
    """
    # self.source always has a trailing newline; strip it before asking
    # for the next indent.
    self.indent_spaces = find_next_indent(self.source[:-1])
    self._full_dedent = (self.indent_spaces == 0)

def _store(self, lines, buffer=None, store='source'):
    """Store one or more lines of input.

    If input lines are not newline-terminated, a newline is automatically
    appended.

    Parameters
    ----------
    lines : str
        Text to append to the buffer as a single entry.
    buffer : list, optional
        List that receives the text; defaults to ``self._buffer``.
    store : str, optional
        Name of the attribute on ``self`` that is set to the joined
        contents of ``buffer`` (as produced by ``self._set_source``).
    """
    if buffer is None:
        buffer = self._buffer

    if lines.endswith('\n'):
        buffer.append(lines)
    else:
        buffer.append(lines + '\n')
    # Keep the named attribute in sync with the buffer it mirrors.
    setattr(self, store, self._set_source(buffer))

def _set_source(self, buffer):
    """Return the entries of ``buffer`` concatenated into one string."""
    return u''.join(buffer)

class IPythonInputSplitter(InputSplitter):
    """An input splitter that recognizes all of IPython's special syntax.

    Each pushed line is run through three stages of transformers
    (physical-line, logical-line and Python-line transforms, with an
    assembler in front of the last two stages) before being handed to
    :meth:`InputSplitter.push`.
    """

    # String with raw, untransformed input.
    source_raw = ''

    # Flag to track when a transformer has stored input that it hasn't given
    # back yet.
    transformer_accumulating = False

    # Flag to track when assemble_python_lines has stored input that it hasn't
    # given back yet.
    within_python_line = False

    # Private attributes

    # List with lines of raw input accumulated so far.
    _buffer_raw = None

    def __init__(self, line_input_checker=True, physical_line_transforms=None,
                 logical_line_transforms=None, python_line_transforms=None):
        """Create the splitter and its transformer pipeline.

        Parameters
        ----------
        line_input_checker : bool
            Passed to the default ``cellmagic`` transformer as
            ``end_on_blank_line``.  Only used when
            ``physical_line_transforms`` is not supplied.
        physical_line_transforms : list, optional
            Replacement for the default physical-line transformers.
        logical_line_transforms : list, optional
            Replacement for the default logical-line transformers.
        python_line_transforms : list, optional
            Replacement for the default (empty) Python-line transformers.
        """
        super(IPythonInputSplitter, self).__init__()
        self._buffer_raw = []
        self._validate = True

        if physical_line_transforms is not None:
            self.physical_line_transforms = physical_line_transforms
        else:
            self.physical_line_transforms = [
                leading_indent(),
                classic_prompt(),
                ipy_prompt(),
                cellmagic(end_on_blank_line=line_input_checker),
            ]

        self.assemble_logical_lines = assemble_logical_lines()
        if logical_line_transforms is not None:
            self.logical_line_transforms = logical_line_transforms
        else:
            self.logical_line_transforms = [
                help_end(),
                escaped_commands(),
                assign_from_magic(),
                assign_from_system(),
            ]

        self.assemble_python_lines = assemble_python_lines()
        if python_line_transforms is not None:
            self.python_line_transforms = python_line_transforms
        else:
            # We don't use any of these at present
            self.python_line_transforms = []

    @property
    def transforms(self):
        """Quick access to all transformers."""
        return (self.physical_line_transforms
                + [self.assemble_logical_lines] + self.logical_line_transforms
                + [self.assemble_python_lines] + self.python_line_transforms)

    @property
    def transforms_in_use(self):
        """Transformers, excluding logical line transformers if we're in a
        Python line."""
        t = self.physical_line_transforms[:]
        if not self.within_python_line:
            t += [self.assemble_logical_lines] + self.logical_line_transforms
        return t + [self.assemble_python_lines] + self.python_line_transforms

    def reset(self):
        """Reset the input buffer and associated state."""
        super(IPythonInputSplitter, self).reset()
        # Clear in place so existing references to the list stay valid.
        self._buffer_raw[:] = []
        self.source_raw = ''
        self.transformer_accumulating = False
        self.within_python_line = False

        for t in self.transforms:
            try:
                t.reset()
            except SyntaxError:
                # Nothing that calls reset() expects to handle transformer
                # errors
                pass

    def flush_transformers(self):
        """Drain every transformer in use and store whatever they emit.

        Each transformer is reset in turn; anything it returns is fed
        line by line into the next transformer.  The output of the last
        one, if any, is joined with newlines and stored via ``_store``.
        """
        def _flush(transform, outs):
            """yield transformed lines

            always strings, never None

            transform: the current transform
            outs: an iterable of previously transformed inputs.
                  Each may be multiline, which will be passed
                  one line at a time to transform.
            """
            for out in outs:
                for line in out.splitlines():
                    # push one line at a time
                    tmp = transform.push(line)
                    if tmp is not None:
                        yield tmp

            # reset the transform
            tmp = transform.reset()
            if tmp is not None:
                yield tmp

        out = []
        # Chain the generators lazily; nothing runs until list() below.
        for t in self.transforms_in_use:
            out = _flush(t, out)

        out = list(out)
        if out:
            self._store('\n'.join(out))

    def raw_reset(self):
        """Return raw input only and perform a full reset.
        """
        out = self.source_raw
        self.reset()
        return out

    def source_reset(self):
        """Flush the transformers, return ``self.source``, then reset.

        The reset happens in a ``finally`` clause, so it also runs if
        flushing raises.
        """
        try:
            self.flush_transformers()
            return self.source
        finally:
            self.reset()

    def push_accepts_more(self):
        """Return whether more input can be accepted.

        Always True while a transformer is still accumulating input;
        otherwise defers to the parent class.
        """
        if self.transformer_accumulating:
            return True
        return super(IPythonInputSplitter, self).push_accepts_more()

    def transform_cell(self, cell):
        """Process and translate a cell of input.

        Resets the splitter, pushes ``cell``, flushes the transformers and
        returns the resulting ``self.source``.  The splitter is reset again
        afterwards, even if an exception is raised.
        """
        self.reset()
        try:
            self.push(cell)
            self.flush_transformers()
            return self.source
        finally:
            self.reset()

    def push(self, lines):
        """Push one or more lines of IPython input.

        This stores the given lines and returns a status code indicating
        whether the code forms a complete Python block or not, after processing
        all input lines for special IPython syntax.

        Any exceptions generated in compilation are swallowed, but if an
        exception was produced, the method returns True.

        Parameters
        ----------
        lines : string
            One or more lines of Python input.

        Returns
        -------
        is_complete : boolean
            True if the current input source (the result of the current input
            plus prior inputs) forms a complete Python execution block.  Note that
            this value is also stored as a private attribute (_is_complete), so it
            can be queried at any time.
        """
        # We must ensure all input is pure unicode
        lines = cast_unicode(lines, self.encoding)
        # ''.splitlines() --> [], but we need to push the empty line to transformers
        lines_list = lines.splitlines()
        if not lines_list:
            lines_list = ['']

        # Store raw source before applying any transformations to it.  Note
        # that this must be done *after* the reset() call that would otherwise
        # flush the buffer.
        # NOTE(review): no reset() call is made in this method; the remark
        # above looks like a leftover from an earlier version - confirm.
        self._store(lines, self._buffer_raw, 'source_raw')

        # lines_list is never empty here, so ``out`` is always bound; the
        # status of the last line pushed is what gets returned.
        for line in lines_list:
            out = self.push_line(line)

        return out

    def push_line(self, line):
        """Run a single line through the transformer pipeline.

        Returns False (and sets ``transformer_accumulating``) as soon as
        any transformer or assembler returns None for the line.  Otherwise
        clears ``transformer_accumulating`` and returns the result of
        pushing the transformed line to the parent class.
        """
        def _accumulating(dbg):
            # ``dbg`` identifies the stage that is holding input; it is only
            # used by the commented-out debug print.
            #print(dbg)
            self.transformer_accumulating = True
            return False

        for transformer in self.physical_line_transforms:
            line = transformer.push(line)
            if line is None:
                return _accumulating(transformer)

        # Logical-line handling is skipped while assemble_python_lines is
        # still holding part of a Python line.
        if not self.within_python_line:
            line = self.assemble_logical_lines.push(line)
            if line is None:
                return _accumulating('acc logical line')

            for transformer in self.logical_line_transforms:
                line = transformer.push(line)
                if line is None:
                    return _accumulating(transformer)

        line = self.assemble_python_lines.push(line)
        if line is None:
            self.within_python_line = True
            return _accumulating('acc python line')
        else:
            self.within_python_line = False

        for transformer in self.python_line_transforms:
            line = transformer.push(line)
            if line is None:
                return _accumulating(transformer)

        #print("transformers clear") #debug
        self.transformer_accumulating = False
        return super(IPythonInputSplitter, self).push(line)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             """Input handling and transformation machinery.
             The first class in this module, :class:`InputSplitter`, is designed to tell when
             input from a line-oriented frontend is complete and should be executed, and when
             the user should be prompted for another line of code instead. The name 'input
             splitter' is largely for historical reasons.
             A companion, :class:`IPythonInputSplitter`, provides the same functionality but
             with full support for the extended IPython syntax (magics, system calls, etc).
             The code to actually do these transformations is in :mod:`IPython.core.inputtransformer`.
             :class:`IPythonInputSplitter` feeds the raw code to the transformers in order
             and stores the results.
             For more details, see the class docstrings below.
             """
             # Copyright (c) IPython Development Team.
             # Distributed under the terms of the Modified BSD License.
             import ast
             import codeop
             import io
             import re
             import sys
             import tokenize
             import warnings
             from IPython.utils.py3compat import cast_unicode
             from IPython.core.inputtransformer import (leading_indent,
                                                        classic_prompt,
                                                        ipy_prompt,
                                                        cellmagic,
                                                        assemble_logical_lines,
                                                        help_end,
                                                        escaped_commands,
                                                        assign_from_magic,
                                                        assign_from_system,
                                                        assemble_python_lines,
                                                        )
             # These are available in this module for backwards compatibility.
             from IPython.core.inputtransformer import (ESC_SHELL, ESC_SH_CAP, ESC_HELP,
                                                     ESC_HELP2, ESC_MAGIC, ESC_MAGIC2,
                                                     ESC_QUOTE, ESC_QUOTE2, ESC_PAREN, ESC_SEQUENCES)
             #-----------------------------------------------------------------------------
             # Utilities
             #-----------------------------------------------------------------------------
             # FIXME: These are general-purpose utilities that later can be moved to the
             # general ward.  Kept here for now because we're being very strict about test
             # coverage with this code, and this lets us ensure that we keep 100% coverage
             # while developing.
             # Compiled regexps for autoindent management.
             #
             # dedent_re matches an indented line whose statement normally ends a block
             # of code: raise, return, pass, break or continue.
             dedent_re = re.compile('|'.join([
                 r'^\s+raise(\s.*)?$', # raise statement (+ space + other stuff, maybe)
                 r'^\s+raise\([^\)]*\).*$', # wacky raise with immediate open paren
                 r'^\s+return(\s.*)?$', # normal return (+ space + other stuff, maybe)
                 r'^\s+return\([^\)]*\).*$', # wacky return with immediate open paren
                 r'^\s+pass\s*$', # pass (optionally followed by trailing spaces)
                 r'^\s+break\s*$', # break (optionally followed by trailing spaces)
                 r'^\s+continue\s*$', # continue (optionally followed by trailing spaces)
             ]))
             # Leading run of blanks (space, tab, CR, FF, VT - but not newline) at the
             # very start of a string.
             ini_spaces_re = re.compile(r'^([ \t\r\f\v]+)')
             # regexp to match pure comment lines so we don't accidentally insert 'if 1:'
             # before pure comments.  This must be a raw string: '\s' and '\#' are regex
             # escapes, and in a plain literal they are invalid string escapes that make
             # the interpreter emit a warning when the module is compiled.
             comment_line_re = re.compile(r'^\s*\#')
             def num_ini_spaces(s):
                 """Count the whitespace characters at the start of a string.

                 A tab counts as one character, exactly like a space.  Mixing tabs and
                 spaces in the user's input is *not* supported for now.

                 Parameters
                 ----------
                 s : string

                 Returns
                 -------
                 n : int
                   Length of the leading whitespace run, 0 when there is none.
                 """
                 leading = ini_spaces_re.match(s)
                 return leading.end() if leading else 0
             # Fake token types for partial_tokens.  They are numbered from
             # tokenize.N_TOKENS upwards, i.e. starting at the value tokenize itself
             # uses as the count of its token types.
             INCOMPLETE_STRING = tokenize.N_TOKENS
             IN_MULTILINE_STATEMENT = INCOMPLETE_STRING + 1
             # The 2 classes below have the same API as TokenInfo, but don't try to look up
             # a token type name that they won't find.
             class IncompleteString:
                 """Pseudo-token standing for a string literal left open at end of input.

                 Exposes ``type``, ``exact_type``, ``start``, ``end`` and ``line`` the way
                 a tokenize token does, and keeps the unfinished text in ``s``.
                 """
                 type = INCOMPLETE_STRING
                 exact_type = INCOMPLETE_STRING

                 def __init__(self, s, start, end, line):
                     self.s, self.start = s, start
                     self.end, self.line = end, line
             class InMultilineStatement:
                 """Pseudo-token marking that the input stops inside a multi-line statement.

                 It is zero-width: ``start`` and ``end`` are both ``pos`` and the token
                 text ``s`` is empty.
                 """
                 type = IN_MULTILINE_STATEMENT
                 exact_type = IN_MULTILINE_STATEMENT

                 def __init__(self, pos, line):
                     self.s = ''
                     self.start = pos
                     self.end = pos
                     self.line = line
             def partial_tokens(s):
                 """Yield the tokens of a piece of code that may stop half-way.

                 Ordinary tokens are passed through from ``tokenize.generate_tokens``.
                 When the tokenizer gives up with a ``TokenError``, one extra pseudo-token
                 is yielded last: an INCOMPLETE_STRING if the message mentions a
                 multi-line string, an IN_MULTILINE_STATEMENT if it mentions a multi-line
                 statement.  Any other ``TokenError`` is re-raised.
                 """
                 source_readline = io.StringIO(s).readline
                 # Placeholder "previous token", needed by the handler below when the
                 # tokenizer fails before producing anything.
                 token = tokenize.TokenInfo(tokenize.NEWLINE, '', (1, 0), (1, 0), '')
                 try:
                     for token in tokenize.generate_tokens(source_readline):
                         yield token
                 except tokenize.TokenError as err:
                     # The tokenizer ran out of input in the middle of something.
                     src_lines = s.splitlines(keepends=True)
                     final_line = src_lines[-1]
                     eof_pos = (len(src_lines), len(final_line))
                     message = err.args[0]
                     if 'multi-line string' in message:
                         # The open string starts where the last good token ended.
                         start = token.end
                         row, col = start
                         remainder = src_lines[row-1][col:] + ''.join(src_lines[row:])
                         yield IncompleteString(remainder, start, eof_pos, final_line)
                     elif 'multi-line statement' in message:
                         yield InMultilineStatement(eof_pos, final_line)
                     else:
                         raise
             def find_next_indent(code):
                 """Find the number of spaces for the next line of indentation.

                 Parameters
                 ----------
                 code : string
                   The source entered so far; it may be incomplete.

                 Returns
                 -------
                 n : int
                   Suggested indentation, in spaces, for the line following ``code``.
                 """
                 tokens = list(partial_tokens(code))
                 if tokens and tokens[-1].type == tokenize.ENDMARKER:
                     tokens.pop()
                 # Strip *every* trailing DEDENT/NEWLINE/COMMENT, not just one.  The
                 # tokenizer can end with several of them in a row (a NEWLINE followed by
                 # DEDENTs, or a COMMENT followed by a NEWLINE), and whatever is left in
                 # last position must be the token that decides the indentation.
                 ignorable = {tokenize.DEDENT, tokenize.NEWLINE, tokenize.COMMENT}
                 while tokens and tokens[-1].type in ignorable:
                     tokens.pop()
                 if not tokens:
                     return 0

                 if tokens[-1].type == INCOMPLETE_STRING:
                     # Inside a multiline string
                     return 0

                 # Find the indents used before
                 prev_indents = [0]
                 def _add_indent(n):
                     if n != prev_indents[-1]:
                         prev_indents.append(n)

                 tokiter = iter(tokens)
                 for tok in tokiter:
                     if tok.type in {tokenize.INDENT, tokenize.DEDENT}:
                         _add_indent(tok.end[1])
                     elif tok.type == tokenize.NL:
                         # After a non-logical newline, the column of the next token
                         # gives the indentation of the continuation line.
                         try:
                             _add_indent(next(tokiter).start[1])
                         except StopIteration:
                             break

                 last_indent = prev_indents.pop()

                 # If we've just opened a multiline statement (e.g. 'a = ['), indent more
                 if tokens[-1].type == IN_MULTILINE_STATEMENT:
                     # The marker may be the only token (input that is just a line
                     # continuation), so check the length before looking behind it.
                     if len(tokens) > 1 and tokens[-2].exact_type in {
                             tokenize.LPAR, tokenize.LSQB, tokenize.LBRACE}:
                         return last_indent + 4
                     return last_indent

                 if tokens[-1].exact_type == tokenize.COLON:
                     # Line ends with colon - indent
                     return last_indent + 4

                 if last_indent:
                     # Examine the last line for dedent cues - statements like return or
                     # raise which normally end a block of code.
                     last_line_starts = 0
                     for i, tok in enumerate(tokens):
                         if tok.type == tokenize.NEWLINE:
                             last_line_starts = i + 1

                     last_line_tokens = tokens[last_line_starts:]
                     names = [t.string for t in last_line_tokens if t.type == tokenize.NAME]
                     if names and names[0] in {'raise', 'return', 'pass', 'break', 'continue'}:
                         # Find the most recent indentation less than the current level
                         for indent in reversed(prev_indents):
                             if indent < last_indent:
                                 return indent

                 return last_indent
             def last_blank(src):
                 """Tell whether the last line of the input source is blank.

                 The last line is the final element of ``src.splitlines()``; it is blank
                 when it is empty or made only of whitespace.  An empty ``src`` is not
                 considered to end in a blank.

                 Parameters
                 ----------
                 src : string
                   A single or multiline string.
                 """
                 if not src:
                     return False
                 final_line = src.splitlines()[-1]
                 return not final_line or final_line.isspace()
             last_two_blanks_re = re.compile(r'\n\s*\n\s*$', re.MULTILINE)
             last_two_blanks_re2 = re.compile(r'.+\n\s*\n\s+$', re.MULTILINE)
             def last_two_blanks(src):
                 """Tell whether the input source ends in two blanks.

                 A blank is either a newline or a line consisting of whitespace.

                 Parameters
                 ----------
                 src : string
                   A single or multiline string.
                 """
                 if not src:
                     return False
                 # A single regexp on the raw source never passed the whole test suite,
                 # so the check is done on a synthetic string instead: the last two
                 # lines of the source, preceded by '###\n' standing in for everything
                 # that came before them.  That fixed shape can be tested with the two
                 # regexps above.  Validate against the full test suite before changing
                 # any of this.
                 tail = src.splitlines()[-2:]
                 probe = '\n'.join(['###\n'] + tail)
                 return any(rx.match(probe) is not None
                            for rx in (last_two_blanks_re, last_two_blanks_re2))
             def remove_comments(src):
                 """Strip everything from a '#' to the end of its line.

                 Note: this is purely textual, so a '#' inside a string literal is
                 treated as the start of a comment too.

                 Parameters
                 ----------
                 src : string
                   A single or multiline input string.

                 Returns
                 -------
                 String with all Python comments removed.
                 """
                 comment = re.compile('#.*')
                 return comment.sub('', src)
             def get_input_encoding():
                 """Return the default standard input encoding.

                 Falls back to 'ascii' when sys.stdin has no ``encoding`` attribute or
                 when that attribute is None, which happens in some unusual
                 environments; the result is therefore never None."""
                 stdin_encoding = getattr(sys.stdin, 'encoding', None)
                 return 'ascii' if stdin_encoding is None else stdin_encoding
             #-----------------------------------------------------------------------------
             # Classes and functions for normal Python syntax handling
             #-----------------------------------------------------------------------------
             class InputSplitter(object):
                 r"""Accumulate lines of Python source until they form an executable block.

                 Feed the object one or more lines at a time with :meth:`push`; each call
                 reports whether the code pushed so far compiles to a complete block.
                 :meth:`push_accepts_more` answers the related question a line-oriented
                 frontend cares about: should the user be prompted for another line?

                 A minimal terminal-style client looks like this::

                     isp = InputSplitter()
                     while isp.push_accepts_more():
                         indent = ' '*isp.indent_spaces
                         prompt = '>>> ' + indent
                         line = indent + input(prompt)
                         isp.push(line)
                     print('Input source was:\n', isp.source_reset())
                 """
                 # Indentation, in spaces, suggested for the next line given everything
                 # pushed so far.  Frontends read this to implement auto-indent.
                 indent_spaces = 0
                 # Default input encoding.  Filled in by __init__ from
                 # get_input_encoding(); a client that knows better may overwrite it.
                 encoding = ''
                 # The full source pushed so far, as one string.  This is the attribute
                 # to read when you want the current input.
                 source = ''
                 # Code object compiled from `source`, or None when the source is
                 # incomplete or does not compile.  push() keeps it in sync.
                 code = None

                 # Private attributes

                 # List of the chunks of input accumulated so far
                 _buffer = None
                 # Command compiler
                 _compile = None
                 # True when the suggested indentation is back to flush-left
                 _full_dedent = False
                 # Whether the current block is complete
                 _is_complete = None
                 # Whether the current block has an unrecoverable syntax error
                 _is_invalid = False

                 def __init__(self):
                     """Create a new InputSplitter instance."""
                     self._buffer = []
                     self._compile = codeop.CommandCompiler()
                     self.encoding = get_input_encoding()

                 def reset(self):
                     """Empty the input buffer and return all state to its initial value."""
                     # Clear in place so the list object itself stays the same.
                     del self._buffer[:]
                     self.source = ''
                     self.code = None
                     self.indent_spaces = 0
                     self._is_complete = False
                     self._is_invalid = False
                     self._full_dedent = False

                 def source_reset(self):
                     """Return the accumulated source, then perform a full reset."""
                     text = self.source
                     self.reset()
                     return text

                 def check_complete(self, source):
                     """Classify a block of code as complete, incomplete or invalid.

                     This is a non-stateful API: the splitter is reset before the check
                     and again afterwards, so any previously pushed input is lost.

                     Parameters
                     ----------
                     source : string
                       Python input code, which can be multiline.

                     Returns
                     -------
                     status : str
                       One of 'complete', 'incomplete', or 'invalid' if source is not a
                       prefix of valid code.
                     indent_spaces : int or None
                       The number of spaces by which to indent the next line of code. If
                       status is not 'incomplete', this is None.
                     """
                     self.reset()
                     try:
                         try:
                             self.push(source)
                         except SyntaxError:
                             # Transformers in IPythonInputSplitter can raise
                             # SyntaxError, which push() will not catch.
                             return 'invalid', None
                         if self._is_invalid:
                             return 'invalid', None
                         if self.push_accepts_more():
                             return 'incomplete', self.indent_spaces
                         return 'complete', None
                     finally:
                         self.reset()

                 def push(self, lines):
                     """Push one or more lines of input.

                     The lines are appended to the stored source, which is then compiled
                     to find out whether it forms a complete Python block.  Errors raised
                     by the compiler are swallowed; in that case the block is flagged
                     invalid and the method returns True.

                     Parameters
                     ----------
                     lines : string
                       One or more lines of Python input.

                     Returns
                     -------
                     is_complete : boolean
                       True if the current input source (the result of the current input
                       plus prior inputs) forms a complete Python execution block.  Note
                       that this value is also stored as a private attribute
                       (``_is_complete``), so it can be queried at any time.
                     """
                     self._store(lines)
                     text = self.source

                     # Clear the previous verdict before compiling, so that a failure
                     # cannot leave a code object that disagrees with the source.
                     self.code = None
                     self._is_complete = None
                     self._is_invalid = False

                     # A trailing backslash-newline always asks for a continuation line
                     if text.endswith('\\\n'):
                         return False

                     self._update_indent()
                     try:
                         with warnings.catch_warnings():
                             warnings.simplefilter('error', SyntaxWarning)
                             compiled = self._compile(text, symbol="exec")
                     # Invalid syntax can surface as any of several exception types from
                     # inside the compiler, so all of them are caught.  A syntax error
                     # makes the block 'ready' straight away, so that the invalid Python
                     # can be sent on for evaluation with possible ipython
                     # special-syntax conversion.
                     except (SyntaxError, OverflowError, ValueError, TypeError,
                             MemoryError, SyntaxWarning):
                         self._is_invalid = True
                         self._is_complete = True
                     else:
                         # No exception, though the compiler may still have returned
                         # None to say the code is incomplete.
                         self.code = compiled
                         self._is_complete = compiled is not None
                     return self._is_complete

                 def push_accepts_more(self):
                     """Return whether a block of interactive input can accept more input.

                     This method is meant for line-oriented frontends, which must guess
                     whether a block is finished from the lines seen so far.  No more
                     input is accepted when the block is complete (a syntax error also
                     counts as complete, see :meth:`push`) and either:

                     * the last line is blank, or
                     * the next indentation is flush-left and the source is a single line,
                       cannot be parsed, or parses to a single statement without a body.

                     In every other case more input is accepted.  The method never raises
                     the syntax error itself, as clients typically want to send invalid
                     syntax to an execution backend that may turn it into valid Python
                     through one of the dynamic IPython mechanisms.
                     """
                     # With incomplete input, unconditionally accept more
                     if not self._is_complete:
                         return True

                     src_lines = self.source.splitlines()

                     # The user can make any (complete) input execute by leaving a
                     # blank line
                     final = src_lines[-1]
                     if final == '' or final.isspace():
                         return False

                     # Still inside an indented block: keep going
                     if self.indent_spaces != 0:
                         return True

                     # Flush left from here on.  A single line, as after 'a=1', is
                     # executed straight away.
                     if len(src_lines) <= 1:
                         return False
                     try:
                         tree = ast.parse(''.join(self._buffer))
                     except Exception:
                         return False
                     # So is a single AST node with no body of its own.
                     lone_simple_stmt = (len(tree.body) == 1
                                         and not hasattr(tree.body[0], 'body'))
                     return not lone_simple_stmt

                 def _update_indent(self):
                     """Recompute ``indent_spaces`` and ``_full_dedent`` from the source."""
                     # self.source always has a trailing newline, dropped here
                     spaces = find_next_indent(self.source[:-1])
                     self.indent_spaces = spaces
                     self._full_dedent = (spaces == 0)

                 def _store(self, lines, buffer=None, store='source'):
                     """Store one or more lines of input.

                     ``lines`` is appended to ``buffer`` (``self._buffer`` when None),
                     with a newline added if it does not already end with one.  The
                     joined buffer is then assigned to the attribute named by ``store``.
                     """
                     target = self._buffer if buffer is None else buffer
                     target.append(lines if lines.endswith('\n') else lines + '\n')
                     setattr(self, store, self._set_source(target))

                 def _set_source(self, buffer):
                     """Join the chunks of ``buffer`` into a single string."""
                     joined = ''.join(buffer)
                     return joined
             class IPythonInputSplitter(InputSplitter):
                 """An input splitter that recognizes all of IPython's special syntax."""
                 # String with raw, untransformed input.  push() rebuilds it from
                 # _buffer_raw each time new lines arrive.
                 source_raw = ''
                 # Flag to track when a transformer has stored input that it hasn't given
                 # back yet.  While it is set, push_accepts_more() always returns True.
                 transformer_accumulating = False
                 # Flag to track when assemble_python_lines has stored input that it hasn't
                 # given back yet.  While it is set, transforms_in_use leaves out the
                 # logical-line stage.
                 within_python_line = False
                 # Private attributes
                 # List with lines of raw input accumulated so far.  None at class level;
                 # __init__ gives every instance its own list.
                 _buffer_raw = None
                 def __init__(self, line_input_checker=True, physical_line_transforms=None,
                              logical_line_transforms=None, python_line_transforms=None):
                     """Set up the transformer stages.

                     Parameters
                     ----------
                     line_input_checker : bool
                       Passed to the default ``cellmagic`` transformer as
                       ``end_on_blank_line``.  Unused when ``physical_line_transforms``
                       is given.
                     physical_line_transforms : list or None
                       Transformers for the physical-line stage; None selects the
                       defaults.
                     logical_line_transforms : list or None
                       Transformers for the logical-line stage; None selects the
                       defaults.
                     python_line_transforms : list or None
                       Transformers for the Python-line stage; None selects an empty
                       list.
                     """
                     super(IPythonInputSplitter, self).__init__()
                     self._buffer_raw = []
                     self._validate = True

                     if physical_line_transforms is None:
                         physical_line_transforms = [
                             leading_indent(),
                             classic_prompt(),
                             ipy_prompt(),
                             cellmagic(end_on_blank_line=line_input_checker),
                         ]
                     self.physical_line_transforms = physical_line_transforms

                     self.assemble_logical_lines = assemble_logical_lines()
                     if logical_line_transforms is None:
                         logical_line_transforms = [
                             help_end(),
                             escaped_commands(),
                             assign_from_magic(),
                             assign_from_system(),
                         ]
                     self.logical_line_transforms = logical_line_transforms

                     self.assemble_python_lines = assemble_python_lines()
                     if python_line_transforms is None:
                         # We don't use any of these at present
                         python_line_transforms = []
                     self.python_line_transforms = python_line_transforms
                 @property
                 def transforms(self):
                     "Quick access to all transformers."
                     return self.physical_line_transforms + \
                         [self.assemble_logical_lines] + self.logical_line_transforms + \
                         [self.assemble_python_lines]  + self.python_line_transforms
                 @property
                 def transforms_in_use(self):
                     """Transformers, excluding logical line transformers if we're in a
                     Python line."""
                     t = self.physical_line_transforms[:]
                     if not self.within_python_line:
                         t += [self.assemble_logical_lines] + self.logical_line_transforms
                     return t + [self.assemble_python_lines] + self.python_line_transforms
                 def reset(self):
                     """Reset the input buffers, the flags and every transformer."""
                     super(IPythonInputSplitter, self).reset()
                     # Clear in place so the list object itself stays the same.
                     del self._buffer_raw[:]
                     self.source_raw = ''
                     self.within_python_line = False
                     self.transformer_accumulating = False
                     for stage in self.transforms:
                         try:
                             stage.reset()
                         except SyntaxError:
                             # Nothing that calls reset() expects to handle transformer
                             # errors, so they are dropped here.
                             pass
                 def flush_transformers(self):
                     """Drain the transformers in use and store whatever they give back.

                     Each transformer is reset in pipeline order; anything a reset
                     returns is pushed, line by line, through the transformers that come
                     after it.  If any text reaches the end of the chain it is joined
                     with newlines and appended to the transformed source via _store().
                     """
                     def _flush(transform, outs):
                         """yield transformed lines

                         always strings, never None

                         transform: the current transform
                         outs: an iterable of previously transformed inputs.
                              Each may be multiline, which will be passed
                              one line at a time to transform.
                         """
                         for out in outs:
                             for line in out.splitlines():
                                 # push one line at a time
                                 tmp = transform.push(line)
                                 if tmp is not None:
                                     yield tmp
                         # reset the transform, which may hand back text it was holding
                         tmp = transform.reset()
                         if tmp is not None:
                             yield tmp
                     # Build the chain: each generator consumes the one before it.
                     # Nothing runs yet, since generators are lazy.
                     out = []
                     for t in self.transforms_in_use:
                         out = _flush(t, out)
                     # Exhausting the outermost generator drives the whole chain.
                     out = list(out)
                     if out:
                         self._store('\n'.join(out))
                 def raw_reset(self):
                     """Return the raw, untransformed input, then perform a full reset.

                     The transformers are not flushed first; only ``source_raw`` is
                     returned.
                     """
                     raw_text = self.source_raw
                     self.reset()
                     return raw_text
                 def source_reset(self):
                     """Flush the transformers, return the transformed source, then reset.

                     The reset happens even when flushing raises.
                     """
                     try:
                         self.flush_transformers()
                         flushed = self.source
                     finally:
                         self.reset()
                     return flushed
                 def push_accepts_more(self):
                     if self.transformer_accumulating:
                         return True
                     else:
                         return super(IPythonInputSplitter, self).push_accepts_more()
                 def transform_cell(self, cell):
                     """Process and translate a cell of input.

                     The splitter is reset, the cell is pushed, the transformers are
                     flushed, and the resulting transformed source is returned.  The
                     splitter is reset again on the way out, even when an exception
                     is raised.
                     """
                     self.reset()
                     try:
                         self.push(cell)
                         self.flush_transformers()
                         translated = self.source
                     finally:
                         self.reset()
                     return translated
                 def push(self, lines):
                     """Push one or more lines of IPython input.

                     The raw text is recorded in ``source_raw``, then each physical line
                     is handed to :meth:`push_line`, which applies the IPython
                     transformations.  The result of the last ``push_line`` call is
                     returned.

                     Parameters
                     ----------
                     lines : string
                       One or more lines of Python input.

                     Returns
                     -------
                     is_complete : boolean
                       True if the current input source (the result of the current input
                       plus prior inputs) forms a complete Python execution block.  Note
                       that this value is also stored as a private attribute
                       (_is_complete), so it can be queried at any time.
                     """
                     # We must ensure all input is pure unicode
                     lines = cast_unicode(lines, self.encoding)

                     # ''.splitlines() --> [], but the empty line still has to reach
                     # the transformers
                     pieces = lines.splitlines() or ['']

                     # Record the raw source before any transformation is applied to it.
                     self._store(lines, self._buffer_raw, 'source_raw')

                     for physical_line in pieces:
                         complete = self.push_line(physical_line)
                     return complete
                 def push_line(self, line):
                     """Send a single line through the transformer stages and push the result.

                     The line passes, in order, through ``physical_line_transforms``,
                     ``assemble_logical_lines`` and ``logical_line_transforms`` (both
                     skipped while ``within_python_line`` is set), ``assemble_python_lines``
                     and finally ``python_line_transforms``.  Any stage may return None,
                     in which case ``transformer_accumulating`` is set and processing of
                     this line stops.

                     Parameters
                     ----------
                     line : string
                       One line of input.

                     Returns
                     -------
                     is_complete : boolean
                       False when some stage returned None for this line; otherwise the
                       value returned by the parent class's ``push()`` for the fully
                       transformed line.
                     """
                     def _accumulating(dbg):
                         # `dbg` names the stage that kept the line; it is unused at
                         # runtime and exists only as a hook for debugging.
                         self.transformer_accumulating = True
                         return False

                     for transformer in self.physical_line_transforms:
                         line = transformer.push(line)
                         if line is None:
                             return _accumulating(transformer)

                     # While a multi-line Python statement is being assembled, the logical
                     # line stages are bypassed.
                     if not self.within_python_line:
                         line = self.assemble_logical_lines.push(line)
                         if line is None:
                             return _accumulating('acc logical line')

                         for transformer in self.logical_line_transforms:
                             line = transformer.push(line)
                             if line is None:
                                 return _accumulating(transformer)

                     line = self.assemble_python_lines.push(line)
                     # None means the Python-line assembler is still collecting lines.
                     self.within_python_line = line is None
                     if line is None:
                         return _accumulating('acc python line')

                     for transformer in self.python_line_transforms:
                         line = transformer.push(line)
                         if line is None:
                             return _accumulating(transformer)

                     # Every stage released the line: nothing is accumulating any more.
                     self.transformer_accumulating = False
                     return super(IPythonInputSplitter, self).push(line)