upstream/ipython Commit - r13650:623f7346

1

# -*- coding: utf-8 -*-

1

# -*- coding: utf-8 -*-

2

"""

2

"""

3

Defines a variety of Pygments lexers for highlighting IPython code.

3

Defines a variety of Pygments lexers for highlighting IPython code.

4

5

This includes:

5

This includes:

6

7

IPythonLexer

7

IPythonLexer

8

IPython3Lexer

8

IPython3Lexer

9

Lexers for pure IPython (python + magic/shell commands)

9

Lexers for pure IPython (python + magic/shell commands)

10

11

IPythonPartialTracebackLexer

11

IPythonPartialTracebackLexer

12

IPythonTracebackLexer

12

IPythonTracebackLexer

13

Supports 2.x and 3.x via keyword `python3`. The partial traceback

13

Supports 2.x and 3.x via keyword `python3`. The partial traceback

14

lexer reads everything but the Python code appearing in a traceback.

14

lexer reads everything but the Python code appearing in a traceback.

15

The full lexer combines the partial lexer with an IPython lexer.

15

The full lexer combines the partial lexer with an IPython lexer.

16

17

IPythonConsoleLexer

17

IPythonConsoleLexer

18

A lexer for IPython console sessions, with support for tracebacks.

18

A lexer for IPython console sessions, with support for tracebacks.

19

20

IPyLexer

20

IPyLexer

21

A friendly lexer which examines the first line of text and from it,

21

A friendly lexer which examines the first line of text and from it,

22

decides whether to use an IPython lexer or an IPython console lexer.

22

decides whether to use an IPython lexer or an IPython console lexer.

23

This is probably the only lexer that needs to be explicitly added

23

This is probably the only lexer that needs to be explicitly added

24

to Pygments.

24

to Pygments.

25

26

"""

26

"""

27

#-----------------------------------------------------------------------------

28

29

#

30

# Distributed under the terms of the Modified BSD License.

31

#

32

# The full license is in the file COPYING.txt, distributed with this software.

33

#-----------------------------------------------------------------------------

27

34

28

# Standard library

35

# Standard library

29

import re

36

import re

30

37

31

# Third party

38

# Third party

32

from pygments.lexers import BashLexer, PythonLexer, Python3Lexer

39

from pygments.lexers import BashLexer, PythonLexer, Python3Lexer

33

from pygments.lexer import (

40

from pygments.lexer import (

34

Lexer, DelegatingLexer, RegexLexer, do_insertions, bygroups, using,

41

Lexer, DelegatingLexer, RegexLexer, do_insertions, bygroups, using,

35

)

42

)

36

from pygments.token import (

43

from pygments.token import (

37

Comment, Generic, Keyword, Literal, Name, Operator, Other, Text, Error,

44

Comment, Generic, Keyword, Literal, Name, Operator, Other, Text, Error,

38

)

45

)

39

from pygments.util import get_bool_opt

46

from pygments.util import get_bool_opt

40

47

41

# Local

48

# Local

42

from IPython.testing.skipdoctest import skip_doctest

49

from IPython.testing.skipdoctest import skip_doctest

43

50

44

# Matches a single line of text at a time, trailing newline included.
line_re = re.compile('.*?\n')

# Extra rules that are placed in front of the stock Python 'root' rules so
# that IPython-only syntax (magics, shell escapes) is recognized first.
ipython_tokens = [
    # One or more '%', a word, whitespace, a run of literal dots and the
    # newline; the dots are handed to the Bash lexer.
    # NOTE(review): `\.*` only matches literal dots -- `.*` may have been
    # intended. Confirm before changing, since it alters highlighting.
    (
        r'(\%+)(\w+)\s+(\.*)(\n)',
        bygroups(Operator, Keyword, using(BashLexer), Text)
    ),
    # A magic name on its own: '%' characters followed by a word.
    (
        r'(\%+)(\w+)\b',
        bygroups(Operator, Keyword)
    ),
    # Shell escape: '!' at the start of a line; the remainder of the line
    # is highlighted by the Bash lexer.
    (
        r'^(!)(.+)(\n)',
        bygroups(Operator, using(BashLexer), Text)
    ),
]

52

59

53

def build_ipy_lexer(python3):
    """Builds IPython lexers depending on the value of `python3`.

    The lexer inherits from an appropriate Python lexer and then adds
    information about IPython specific keywords (i.e. magic commands,
    shell commands, etc.)

    Parameters
    ----------
    python3 : bool
        If `True`, then build an IPython lexer from a Python 3 lexer.
        Otherwise, build it from the Python 2 lexer.

    Returns
    -------
    lexer : type
        A new subclass of the selected Python lexer whose 'root' state
        starts with the rules in `ipython_tokens`.

    """
    # It would be nice to have a single IPython lexer class which takes
    # a boolean `python3`.  But since there are two Python lexer classes,
    # we will also have two IPython lexer classes.
    if python3:
        PyLexer = Python3Lexer
        clsname = 'IPython3Lexer'
        name = 'IPython3'
        aliases = ['ipython3']
        doc = """IPython3 Lexer"""
    else:
        PyLexer = PythonLexer
        clsname = 'IPythonLexer'
        name = 'IPython'
        aliases = ['ipython']
        doc = """IPython Lexer"""

    # Shallow copy is enough: only the 'root' entry is rebound, and it is
    # rebound to a brand new list, so the parent's rules are not mutated.
    tokens = PyLexer.tokens.copy()
    tokens['root'] = ipython_tokens + tokens['root']

    attrs = {'name': name, 'aliases': aliases,
             '__doc__': doc, 'tokens': tokens}

    # Use `clsname` (not the human readable `name`) so that the class's
    # __name__ matches the module-level name it is bound to.
    return type(clsname, (PyLexer,), attrs)

89

96

90

97

91

# Concrete lexer classes for pure IPython code, one per Python flavor.
IPythonLexer = build_ipy_lexer(python3=False)
IPython3Lexer = build_ipy_lexer(python3=True)

93

100

94

101

95

class IPythonPartialTracebackLexer(RegexLexer):
    """
    Partial lexer for IPython tracebacks.

    Handles all the non-python output. This works for both Python 2.x and 3.x.
    Anything that is not recognized as traceback decoration is tagged with
    the `Other` token so that a delegating lexer can highlight it afterwards.

    """
    name = 'IPython Partial Traceback'

    tokens = {
        'root': [
            # Tracebacks for syntax errors have a different style.
            # For both types of tracebacks, we mark the first line with
            # Generic.Traceback.  For syntax errors, we mark the filename
            # as we mark the filenames for non-syntax tracebacks.
            #
            # These two regexps define how IPythonConsoleLexer finds a
            # traceback.
            #
            ## Non-syntax traceback
            (r'^(\^C)?(-+\n)', bygroups(Error, Generic.Traceback)),
            ## Syntax traceback
            # The "File" line of a syntax error is indented by two spaces
            # (`  File "<...>", line N`), so both spaces must be matched.
            (r'^(  File)(.*)(, line )(\d+\n)',
             bygroups(Generic.Traceback, Name.Namespace,
                      Generic.Traceback, Literal.Number.Integer)),

            # (Exception Identifier)(Whitespace)(Traceback Message)
            (r'(?u)(^[^\d\W]\w*)(\s*)(Traceback.*?\n)',
             bygroups(Name.Exception, Generic.Whitespace, Text)),
            # (Module/Filename)(Text)(Callee)(Function Signature)
            # Better options for callee and function signature?
            (r'(.*)( in )(.*)(\(.*\)\n)',
             bygroups(Name.Namespace, Text, Name.Entity, Name.Tag)),
            # Regular line: (Whitespace)(Line Number)(Python Code)
            (r'(\s*?)(\d+)(.*?\n)',
             bygroups(Generic.Whitespace, Literal.Number.Integer, Other)),
            # Emphasized line: (Arrow)(Line Number)(Python Code)
            # Using Exception token so arrow color matches the Exception.
            (r'(-*>?\s?)(\d+)(.*?\n)',
             bygroups(Name.Exception, Literal.Number.Integer, Other)),
            # (Exception Identifier)(Message)
            (r'(?u)(^[^\d\W]\w*)(:.*?\n)',
             bygroups(Name.Exception, Text)),
            # Tag everything else as Other, will be handled later.
            (r'.*\n', Other),
        ],
    }

142

149

143

150

144

class IPythonTracebackLexer(DelegatingLexer):
    """
    IPython traceback lexer.

    For doctests, the tracebacks can be snipped as much as desired, with the
    exception of the lines that designate a traceback. For non-syntax error
    tracebacks, this is the line of hyphens. For syntax error tracebacks,
    this is the line which lists the File and line number.

    """
    # This is a DelegatingLexer: the text is first run through the partial
    # IPython traceback lexer, and whatever that lexer tags as "Other" is
    # then handed to the "root" lexer.  The root lexer is the IPython lexer
    # matching the boolean option `python3`.
    name = 'IPython Traceback'
    aliases = ['ipythontb']

    def __init__(self, **options):
        """Pick the root lexer from the `python3` option and initialize."""
        self.python3 = get_bool_opt(options, 'python3', False)

        root_lexer = IPython3Lexer if self.python3 else IPythonLexer

        DelegatingLexer.__init__(
            self, root_lexer, IPythonPartialTracebackLexer, **options
        )

173

180

174

@skip_doctest
class IPythonConsoleLexer(Lexer):
    """
    An IPython console lexer for IPython code-blocks and doctests, such as:

    .. code-block:: rst

        .. code-block:: ipythoncon

            In [1]: a = 'foo'

            In [2]: a
            Out[2]: 'foo'

            In [3]: print a
            foo

            In [4]: 1 / 0


    Support is also provided for IPython exceptions:

    .. code-block:: rst

        .. code-block:: ipythoncon

            In [1]: raise Exception
            ---------------------------------------------------------------------------
            Exception                                 Traceback (most recent call last)
            <ipython-input-1-fca2ab0ca76b> in <module>()
            ----> 1 raise Exception

            Exception:

    """
    name = 'IPython console session'
    aliases = ['ipythoncon']
    mimetypes = ['text/x-ipython-console']

    # The regexps used to determine what is input and what is output.  The
    # input regex should be consistent with and also be the combination of
    # the values of the `in_template` and `in2_template`.  For example, the
    # default prompts are:
    #
    #    c.PromptManager.in_template  = 'In [\#]: '
    #    c.PromptManager.in2_template = '   .\D.: '
    #    c.PromptManager.out_template = 'Out[\#]: '
    #
    # Note, we do not include the trailing whitespace in the regex since
    # we want to allow blank prompts (and editors often remove trailing
    # whitespace).
    #
    in1_regex = r'In \[[0-9]+\]: '
    # The continuation prompt is padded with three leading spaces so that
    # it lines up with the 'In [N]: ' prompt; all three must be matched.
    in2_regex = r'   \.\.+\.: '
    out_regex = r'Out\[[0-9]+\]: '

    #: The regex to determine when a traceback starts.  Either a line of
    #: hyphens (optionally preceded by ^C) or the two-space indented
    #: `  File ..., line N` header of a syntax error.
    ipytb_start = re.compile(r'^(\^C)?(-+\n)|^(  File)(.*)(, line )(\d+\n)')

    def __init__(self, **options):
        """Initialize the IPython console lexer.

        Parameters
        ----------
        python3 : bool
            If `True`, then the console inputs are parsed using a Python 3
            lexer. Otherwise, they are parsed using a Python 2 lexer.
        in1_regex : str
            The regular expression pattern (not compiled) used to detect
            the start of inputs. If missing or `None`, then the default
            input prompt is assumed.
        in2_regex : str
            The regular expression pattern (not compiled) used to detect
            the continuation of inputs. If missing or `None`, then the
            default continuation prompt is assumed.
        out_regex : str
            The regular expression pattern (not compiled) used to detect
            outputs. If missing or `None`, then the default output prompt
            is assumed.

        After initialization, the attributes `in1_regex`, `in2_regex`,
        `out_regex` and their `*_rstrip` counterparts hold compiled
        regular expressions.

        """
        self.python3 = get_bool_opt(options, 'python3', False)

        # So that we can work with input and output prompts which have been
        # rstrip'd (possibly by editors) we also need rstrip'd variants.  If
        # we do not do this, then such prompts will be tagged as 'output'.
        # The reason we can't just use the rstrip'd variants instead is
        # because we want any whitespace associated with the prompt to be
        # inserted with the token.  This allows formatted code to be modified
        # so as to hide the appearance of prompts.  For example, see
        # copybutton.js.
        patterns = {}
        for key in ('in1_regex', 'in2_regex', 'out_regex'):
            pattern = options.get(key)
            if pattern is None:
                # Fall back to the class-level default, which is still a
                # plain pattern string (instance attributes set below hold
                # the compiled versions).
                pattern = getattr(type(self), key)
            patterns[key] = pattern
            patterns[key + '_rstrip'] = pattern.rstrip() + '\n'

        # Compile and save them all.
        for attr, pattern in patterns.items():
            setattr(self, attr, re.compile(pattern))

        Lexer.__init__(self, **options)

        pylexer = IPython3Lexer if self.python3 else IPythonLexer
        self.pylexer = pylexer(**options)
        # The traceback lexer reads the `python3` option itself, so the
        # same class is used for both Python flavors.
        self.tblexer = IPythonTracebackLexer(**options)

        self.reset()

    def reset(self):
        """Return the lexer to its initial state (output mode, no buffer)."""
        self.mode = 'output'
        self.index = 0
        self.buffer = u''
        self.insertions = []

    def buffered_tokens(self):
        """
        Generator of unprocessed tokens after doing insertions and before
        changing to a new state.

        The buffered text is lexed according to the current mode, the
        pending prompt insertions are merged in, and the buffer and the
        insertions are cleared once the generator is exhausted.

        """
        if self.mode == 'output':
            tokens = [(0, Generic.Output, self.buffer)]
        elif self.mode == 'input':
            tokens = self.pylexer.get_tokens_unprocessed(self.buffer)
        else:  # traceback
            tokens = self.tblexer.get_tokens_unprocessed(self.buffer)

        for i, t, v in do_insertions(self.insertions, tokens):
            # All token indexes are relative to the buffer.
            yield self.index + i, t, v

        # Clear it all
        self.index += len(self.buffer)
        self.buffer = u''
        self.insertions = []

    def get_modecode(self, line):
        """
        Returns the next mode and code to be added to the next mode's buffer.

        The next mode depends on current mode and contents of line.

        Parameters
        ----------
        line : str
            A single line of the session, normally ending with a newline.

        Returns
        -------
        mode : str
            One of 'input', 'output' or 'tb'.
        code : str
            The part of `line` that belongs in the buffer of `mode`.
        insertion : tuple or None
            An `(index, token, text)` triple for the prompt that was split
            off from `line`, or `None` when the line carries no prompt.

        """
        # To reduce the number of regex match checks, we have multiple
        # 'if' blocks instead of 'if-elif' blocks.

        not_in_tb = self.mode != 'tb'

        ### Check for possible end of input
        ###
        in2_match = self.in2_regex.match(line)
        in2_match_rstrip = self.in2_regex_rstrip.match(line)
        # A continuation prompt with nothing after it ends the input.
        blank_continuation = bool(
            in2_match and in2_match.group().rstrip() == line.rstrip()
        )
        end_input = blank_continuation or bool(in2_match_rstrip)
        if end_input and not_in_tb:
            # Only look for an end of input when not in tb mode.
            # An ellipsis could appear within the traceback.
            return 'output', u'', (0, Generic.Prompt, line)

        ### Check for output prompt
        ###
        out_match = self.out_regex.match(line)
        out_match_rstrip = self.out_regex_rstrip.match(line)
        if out_match or out_match_rstrip:
            idx = (out_match or out_match_rstrip).end()
            # Use the 'heading' token for output.  We cannot use
            # Generic.Error since it would conflict with exceptions.
            return 'output', line[idx:], (0, Generic.Heading, line[:idx])

        ### Check for input or continuation prompt (non stripped version)
        ###
        in1_match = self.in1_regex.match(line)
        if in1_match or (in2_match and not_in_tb):
            # New input or when not in tb, continued input.
            # We do not check for continued input when in tb since it is
            # allowable to replace a long stack with an ellipsis.
            idx = (in1_match or in2_match).end()
            return 'input', line[idx:], (0, Generic.Prompt, line[:idx])

        ### Check for input or continuation prompt (stripped version)
        ###
        in1_match_rstrip = self.in1_regex_rstrip.match(line)
        if in1_match_rstrip or (in2_match_rstrip and not_in_tb):
            # Same reasoning as above, for prompts whose trailing
            # whitespace has been stripped.
            idx = (in1_match_rstrip or in2_match_rstrip).end()
            return 'input', line[idx:], (0, Generic.Prompt, line[:idx])

        ### Check for traceback
        ###
        if self.ipytb_start.match(line):
            return 'tb', line, None

        ### All other stuff...
        ###
        if self.mode in ('input', 'output'):
            # We assume all other text is output.  Multiline input that
            # does not use the continuation marker cannot be detected.
            # For example, the 3 in the following is clearly output:
            #
            #     In [1]: print 3
            #     3
            #
            # But the following second line is part of the input:
            #
            #     In [2]: while True:
            #         print True
            #
            # In both cases, the 2nd line will be 'output'.
            #
            mode = 'output'
        else:
            mode = 'tb'

        return mode, line, None

    @staticmethod
    def _iter_lines(text):
        """Yield the lines of `text`, including an unterminated last line."""
        end = 0
        for match in line_re.finditer(text):
            end = match.end()
            yield match.group()
        if end < len(text):
            # `line_re` requires a trailing newline; do not silently drop
            # whatever follows the last newline.
            yield text[end:]

    def get_tokens_unprocessed(self, text):
        """Lex `text` line by line, yielding `(index, token, value)` triples.

        Consecutive lines of the same mode are buffered and lexed together;
        the buffer is flushed whenever the mode changes and once more at
        the end of the text.

        """
        self.reset()
        for line in self._iter_lines(text):
            mode, code, insertion = self.get_modecode(line)

            if mode != self.mode:
                # Yield buffered tokens before transitioning to new mode.
                for token in self.buffered_tokens():
                    yield token
                self.mode = mode

            if insertion:
                self.insertions.append((len(self.buffer), [insertion]))
            self.buffer += code

        # Flush whatever is left in the buffer.
        for token in self.buffered_tokens():
            yield token

449

456

450

class IPyLexer(Lexer):
    r"""
    Primary lexer for all IPython-like code.

    This is a simple helper lexer.  If the text, once surrounding whitespace
    has been stripped, begins with "In \[[0-9]+\]:", then the entire text is
    parsed with an IPython console lexer. If not, then the entire text is
    parsed with an IPython lexer.

    The goal is to reduce the number of lexers that are registered
    with Pygments.

    """
    name = 'IPy session'
    aliases = ['ipy']

    def __init__(self, **options):
        """Create the two lexers this helper dispatches to.

        Parameters
        ----------
        python3 : bool
            If `True`, then both the plain-code lexer and the console lexer
            parse Python 3. Otherwise, they parse Python 2.

        """
        self.python3 = get_bool_opt(options, 'python3', False)
        Lexer.__init__(self, **options)

        # Honor `python3` for plain code as well; the console lexer picks
        # its own flavor from the same option.
        code_lexer = IPython3Lexer if self.python3 else IPythonLexer
        self.IPythonLexer = code_lexer(**options)
        self.IPythonConsoleLexer = IPythonConsoleLexer(**options)

    def get_tokens_unprocessed(self, text):
        """Delegate to the console lexer or the plain-code lexer.

        The choice is made once, from the start of the stripped text, and
        the original (unstripped) text is passed to the chosen lexer.

        """
        if re.match(r'(In \[[0-9]+\]:)', text.strip()):
            lex = self.IPythonConsoleLexer
        else:
            lex = self.IPythonLexer
        for token in lex.get_tokens_unprocessed(text):
            yield token

479

486

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # -*- coding: utf-8 -*-
             """
             Defines a variety of Pygments lexers for highlighting IPython code.
             This includes:
                 IPythonLexer
                 IPython3Lexer
                     Lexers for pure IPython (python + magic/shell commands)
                 IPythonPartialTracebackLexer
                 IPythonTracebackLexer
                     Supports 2.x and 3.x via keyword `python3`.  The partial traceback
                     lexer reads everything but the Python code appearing in a traceback.
                     The full lexer combines the partial lexer with an IPython lexer.
                 IPythonConsoleLexer
                     A lexer for IPython console sessions, with support for tracebacks.
                 IPyLexer
                     A friendly lexer which examines the first line of text and from it,
                     decides whether to use an IPython lexer or an IPython console lexer.
                     This is probably the only lexer that needs to be explicitly added
                     to Pygments.
             """
+            #-----------------------------------------------------------------------------
+            # Copyright (c) 2013, the IPython Development Team.
+            #
+            # Distributed under the terms of the Modified BSD License.
+            #
+            # The full license is in the file COPYING.txt, distributed with this software.
+            #-----------------------------------------------------------------------------
             # Standard library
             import re
             # Third party
             from pygments.lexers import BashLexer, PythonLexer, Python3Lexer
             from pygments.lexer import (
                 Lexer, DelegatingLexer, RegexLexer, do_insertions, bygroups, using,
             )
             from pygments.token import (
                 Comment, Generic, Keyword, Literal, Name, Operator, Other, Text, Error,
             )
             from pygments.util import get_bool_opt
             # Local
             from IPython.testing.skipdoctest import skip_doctest
             # Matches one line of text at a time, including its terminating newline.
             line_re = re.compile('.*?\n')
             # IPython-specific lexer rules.  build_ipy_lexer() places them in front of
             # the 'root' rules of the underlying Python lexer.
             ipython_tokens = [
               # Magic name followed by whitespace and then a run of literal dots up
               # to the newline; that run is handed to BashLexer.
               # NOTE(review): `(\.*)` only matches '.' characters.  If arbitrary
               # magic arguments were intended this would be `(.*)` -- confirm before
               # changing, since it alters how magic arguments are highlighted.
               (r'(\%+)(\w+)\s+(\.*)(\n)', bygroups(Operator, Keyword,
                                                    using(BashLexer), Text)),
               # Bare magic name: one or more '%' followed by an identifier.
               (r'(\%+)(\w+)\b', bygroups(Operator, Keyword)),
               # Shell escape: a line starting with '!' has its remainder lexed as Bash.
               (r'^(!)(.+)(\n)', bygroups(Operator, using(BashLexer), Text)),
             ]
             def build_ipy_lexer(python3):
                 """Build an IPython lexer class on top of a Pygments Python lexer.

                 The returned class inherits from an appropriate Python lexer and then
                 adds information about IPython specific keywords (i.e. magic commands,
                 shell commands, etc.) by prepending `ipython_tokens` to the 'root'
                 state of the parent lexer.

                 Parameters
                 ----------
                 python3 : bool
                     If `True`, then build an IPython lexer from a Python 3 lexer.
                     Otherwise build it from the default Python lexer.

                 Returns
                 -------
                 type
                     A new lexer class whose ``__name__`` is ``'IPython3Lexer'`` or
                     ``'IPythonLexer'``.
                 """
                 # It would be nice to have a single IPython lexer class which takes
                 # a boolean `python3`.  But since there are two Python lexer classes,
                 # we will also have two IPython lexer classes.
                 if python3:
                     PyLexer = Python3Lexer
                     clsname = 'IPython3Lexer'
                     name = 'IPython3'
                     aliases = ['ipython3']
                     doc = """IPython3 Lexer"""
                 else:
                     PyLexer = PythonLexer
                     clsname = 'IPythonLexer'
                     name = 'IPython'
                     aliases = ['ipython']
                     doc = """IPython Lexer"""

                 # Shallow-copy the state table so the parent's `tokens` dict is left
                 # untouched; the 'root' entry is rebound to a brand new list.
                 tokens = PyLexer.tokens.copy()
                 tokens['root'] = ipython_tokens + tokens['root']

                 attrs = {'name': name, 'aliases': aliases,
                          '__doc__': doc, 'tokens': tokens}

                 # Create the class under its class name rather than its display name,
                 # so that __name__ and repr() agree with the module-level bindings.
                 return type(clsname, (PyLexer,), attrs)
             # Concrete lexer classes, built once at import time: one derived from the
             # Python 3 lexer and one derived from the default Python lexer.
             IPython3Lexer = build_ipy_lexer(python3=True)
             IPythonLexer = build_ipy_lexer(python3=False)
             class IPythonPartialTracebackLexer(RegexLexer):
                 """
                 Partial lexer for IPython tracebacks.

                 Handles all the non-python output. This works for both Python 2.x and 3.x.

                 Traceback decoration (separator lines, file/line headers, exception
                 names, line numbers, arrows) is given specific token types.  The Python
                 source shown in the traceback, and any line no rule recognises, is
                 tagged ``Other`` so that a delegating lexer can process it afterwards.
                 """
                 name = 'IPython Partial Traceback'
                 # Rules are tried in the order listed, so the more specific patterns
                 # must stay ahead of the catch-all at the end.
                 tokens = {
                     'root': [
                         # Tracebacks for syntax errors have a different style.
                         # For both types of tracebacks, we mark the first line with
                         # Generic.Traceback.  For syntax errors, we mark the filename
                         # as we mark the filenames for non-syntax tracebacks.
                         #
                         # These two regexps define how IPythonConsoleLexer finds a
                         # traceback.
                         #
                         ## Non-syntax traceback
                         (r'^(\^C)?(-+\n)', bygroups(Error, Generic.Traceback)),
                         ## Syntax traceback
                         (r'^(  File)(.*)(, line )(\d+\n)',
                          bygroups(Generic.Traceback, Name.Namespace,
                                   Generic.Traceback, Literal.Number.Integer)),
                         # (Exception Identifier)(Whitespace)(Traceback Message)
                         (r'(?u)(^[^\d\W]\w*)(\s*)(Traceback.*?\n)',
                          bygroups(Name.Exception, Generic.Whitespace, Text)),
                         # (Module/Filename)(Text)(Callee)(Function Signature)
                         # Better options for callee and function signature?
                         (r'(.*)( in )(.*)(\(.*\)\n)',
                          bygroups(Name.Namespace, Text, Name.Entity, Name.Tag)),
                         # Regular line: (Whitespace)(Line Number)(Python Code)
                         (r'(\s*?)(\d+)(.*?\n)',
                          bygroups(Generic.Whitespace, Literal.Number.Integer, Other)),
                         # Emphasized line: (Arrow)(Line Number)(Python Code)
                         # Using Exception token so arrow color matches the Exception.
                         (r'(-*>?\s?)(\d+)(.*?\n)',
                          bygroups(Name.Exception, Literal.Number.Integer, Other)),
                         # (Exception Identifier)(Message)
                         (r'(?u)(^[^\d\W]\w*)(:.*?\n)',
                          bygroups(Name.Exception, Text)),
                         # Tag everything else as Other, will be handled later.
                         (r'.*\n', Other),
                     ],
                 }
             class IPythonTracebackLexer(DelegatingLexer):
                 """
                 Lexer for complete IPython tracebacks.

                 When used in doctests, a traceback may be abbreviated freely as long
                 as the line that marks its start is kept: the row of hyphens for
                 ordinary exceptions, or the "File ..., line N" header for syntax
                 errors.
                 """
                 # Two-stage lexing via DelegatingLexer: the partial traceback lexer
                 # runs first and labels the traceback decoration; whatever it tags
                 # as "Other" is then passed to the root lexer, an IPython lexer
                 # selected by the boolean `python3` option.
                 name = 'IPython Traceback'
                 aliases = ['ipythontb']

                 def __init__(self, **options):
                     """Pick the root IPython lexer according to the `python3` option."""
                     self.python3 = get_bool_opt(options, 'python3', False)
                     root_lexer = IPython3Lexer if self.python3 else IPythonLexer
                     DelegatingLexer.__init__(
                         self, root_lexer, IPythonPartialTracebackLexer, **options
                     )
             @skip_doctest
             class IPythonConsoleLexer(Lexer):
                 """
                 An IPython console lexer for IPython code-blocks and doctests, such as:

                 .. code-block:: rst

                     .. code-block:: ipythoncon

                         In [1]: a = 'foo'

                         In [2]: a
                         Out[2]: 'foo'

                         In [3]: print a
                         foo

                         In [4]: 1 / 0

                 Support is also provided for IPython exceptions:

                 .. code-block:: rst

                     .. code-block:: ipythoncon

                         In [1]: raise Exception
                         ---------------------------------------------------------------------------
                         Exception                                 Traceback (most recent call last)
                         <ipython-input-1-fca2ab0ca76b> in <module>()
                         ----> 1 raise Exception

                         Exception:

                 """
                 name = 'IPython console session'
                 aliases = ['ipythoncon']
                 mimetypes = ['text/x-ipython-console']

                 # The regexps used to determine what is input and what is output. The
                 # input regex should be consistent with and also be the combination of
                 # the values of the `in_template` and `in2_templates`. For example, the
                 # defaults prompts are:
                 #
                 #     c.PromptManager.in_template  = 'In [\#]: '
                 #     c.PromptManager.in2_template = '   .\D.: '
                 #     c.PromptManager.out_template = 'Out[\#]: '
                 #
                 # The patterns below keep the trailing whitespace of the prompt.
                 # __init__ additionally derives rstrip'd variants so that blank
                 # prompts whose trailing whitespace was removed (editors often do
                 # this) are still recognised.
                 #
                 in1_regex = r'In \[[0-9]+\]: '
                 in2_regex = r'   \.\.+\.: '
                 out_regex = r'Out\[[0-9]+\]: '

                 #: The regex to determine when a traceback starts.
                 ipytb_start = re.compile(r'^(\^C)?(-+\n)|^(  File)(.*)(, line )(\d+\n)')

                 @staticmethod
                 def _pattern_source(value, default):
                     """Return the regex source text for a prompt option.

                     `None` selects `default`; a compiled pattern is reduced to its
                     ``.pattern`` source; anything else is returned unchanged.
                     """
                     if value is None:
                         value = default
                     return getattr(value, 'pattern', value)

                 def __init__(self, **options):
                     """Initialize the IPython console lexer.

                     Parameters
                     ----------
                     python3 : bool
                         If `True`, then the console inputs are parsed using a Python 3
                         lexer. Otherwise, they are parsed using a Python 2 lexer.
                     in1_regex : str or compiled pattern
                         The regular expression used to detect the start of inputs.
                         It may end with the prompt's trailing whitespace; a variant
                         with that whitespace stripped is derived automatically.
                         If `None`, then the default input prompt is assumed.
                     in2_regex : str or compiled pattern
                         The regular expression used to detect the continuation of
                         inputs. Trailing whitespace is handled as for `in1_regex`.
                         If `None`, then the default input prompt is assumed.
                     out_regex : str or compiled pattern
                         The regular expression used to detect outputs. If `None`,
                         then the default output prompt is assumed.

                     Notes
                     -----
                     When a compiled pattern is given only its source text is used;
                     its flags are not carried over.
                     """
                     self.python3 = get_bool_opt(options, 'python3', False)

                     # So that we can work with input and output prompts which have been
                     # rstrip'd (possibly by editors) we also need rstrip'd variants. If
                     # we do not do this, then such prompts will be tagged as 'output'.
                     # The reason can't just use the rstrip'd variants instead is because
                     # we want any whitespace associated with the prompt to be inserted
                     # with the token. This allows formatted code to be modified so as hide
                     # the appearance of prompts.  For example, see copybutton.js.
                     for key in ('in1_regex', 'in2_regex', 'out_regex'):
                         # getattr() yields the class-level default pattern here.
                         source = self._pattern_source(options.get(key),
                                                       getattr(self, key))
                         setattr(self, key, re.compile(source))
                         setattr(self, key + '_rstrip',
                                 re.compile(source.rstrip() + '\n'))

                     Lexer.__init__(self, **options)

                     # Only the input lexer class depends on `python3` here; the
                     # traceback lexer reads the same option from `options` itself.
                     pylexer = IPython3Lexer if self.python3 else IPythonLexer
                     self.pylexer = pylexer(**options)
                     self.tblexer = IPythonTracebackLexer(**options)

                     self.reset()

                 def reset(self):
                     """Return to the initial state: 'output' mode with empty buffers."""
                     self.mode = 'output'
                     self.index = 0
                     self.buffer = u''
                     self.insertions = []

                 def buffered_tokens(self):
                     """
                     Generator of unprocessed tokens after doing insertions and before
                     changing to a new state.

                     The buffer is lexed according to the current mode (raw output,
                     IPython input, or traceback), the pending insertions (prompts) are
                     merged in, and the buffer and insertions are cleared afterwards.
                     """
                     if self.mode == 'output':
                         tokens = [(0, Generic.Output, self.buffer)]
                     elif self.mode == 'input':
                         tokens = self.pylexer.get_tokens_unprocessed(self.buffer)
                     else: # traceback
                         tokens = self.tblexer.get_tokens_unprocessed(self.buffer)

                     for i, t, v in do_insertions(self.insertions, tokens):
                         # All token indexes are relative to the buffer.
                         yield self.index + i, t, v

                     # Clear it all
                     # NOTE(review): the index advances by the buffer length only, so
                     # text emitted through insertions (prompts) is not counted --
                     # confirm whether callers rely on absolute offsets.
                     self.index += len(self.buffer)
                     self.buffer = u''
                     self.insertions = []

                 def get_modecode(self, line):
                     """
                     Returns the next mode and code to be added to the next mode's buffer.

                     The next mode depends on current mode and contents of line.

                     Parameters
                     ----------
                     line : str
                         A single line of the session text.

                     Returns
                     -------
                     mode : str
                         One of 'input', 'output' or 'tb'.
                     code : str
                         The part of `line` to append to the buffer.
                     insertion : tuple or None
                         An ``(index, token, text)`` triple for the prompt portion of
                         the line, or `None` when the line carries no prompt.
                     """
                     # To reduce the number of regex match checks, we have multiple
                     # 'if' blocks instead of 'if-elif' blocks.

                     ### Check for possible end of input
                     ###
                     in2_match = self.in2_regex.match(line)
                     in2_match_rstrip = self.in2_regex_rstrip.match(line)
                     end_input = bool(
                         (in2_match and in2_match.group().rstrip() == line.rstrip())
                         or in2_match_rstrip
                     )
                     if end_input and self.mode != 'tb':
                         # Only look for an end of input when not in tb mode.
                         # An ellipsis could appear within the traceback.
                         mode = 'output'
                         code = u''
                         insertion = (0, Generic.Prompt, line)
                         return mode, code, insertion

                     ### Check for output prompt
                     ###
                     out_match = self.out_regex.match(line)
                     out_match_rstrip = self.out_regex_rstrip.match(line)
                     if out_match or out_match_rstrip:
                         mode = 'output'
                         if out_match:
                             idx = out_match.end()
                         else:
                             idx = out_match_rstrip.end()
                         code = line[idx:]
                         # Use the 'heading' token for output.  We cannot use Generic.Error
                         # since it would conflict with exceptions.
                         insertion = (0, Generic.Heading, line[:idx])
                         return mode, code, insertion

                     ### Check for input or continuation prompt (non stripped version)
                     ###
                     in1_match = self.in1_regex.match(line)
                     if in1_match or (in2_match and self.mode != 'tb'):
                         # New input or when not in tb, continued input.
                         # We do not check for continued input when in tb since it is
                         # allowable to replace a long stack with an ellipsis.
                         mode = 'input'
                         if in1_match:
                             idx = in1_match.end()
                         else: # in2_match
                             idx = in2_match.end()
                         code = line[idx:]
                         insertion = (0, Generic.Prompt, line[:idx])
                         return mode, code, insertion

                     ### Check for input prompt (stripped version)
                     ###
                     # A stripped continuation prompt never needs checking here: any
                     # `in2_match_rstrip` sets `end_input`, so outside of 'tb' mode the
                     # end-of-input branch above has already returned, and inside 'tb'
                     # mode continuation prompts are deliberately ignored.
                     in1_match_rstrip = self.in1_regex_rstrip.match(line)
                     if in1_match_rstrip:
                         mode = 'input'
                         idx = in1_match_rstrip.end()
                         code = line[idx:]
                         insertion = (0, Generic.Prompt, line[:idx])
                         return mode, code, insertion

                     ### Check for traceback
                     ###
                     if self.ipytb_start.match(line):
                         mode = 'tb'
                         code = line
                         insertion = None
                         return mode, code, insertion

                     ### All other stuff...
                     ###
                     if self.mode in ('input', 'output'):
                         # We assume all other text is output. Multiline input that
                         # does not use the continuation marker cannot be detected.
                         # For example, the 3 in the following is clearly output:
                         #
                         #    In [1]: print 3
                         #    3
                         #
                         # But the following second line is part of the input:
                         #
                         #    In [2]: while True:
                         #        print True
                         #
                         # In both cases, the 2nd line will be 'output'.
                         #
                         mode = 'output'
                     else:
                         mode = 'tb'

                     code = line
                     insertion = None
                     return mode, code, insertion

                 def get_tokens_unprocessed(self, text):
                     """
                     Yield ``(index, token, value)`` triples for a console session.

                     The text is consumed line by line.  Consecutive lines that share
                     a mode are buffered and lexed together; the buffer is flushed
                     whenever the mode changes and once more at the end.
                     """
                     self.reset()
                     # NOTE(review): line_re only matches newline-terminated lines, so
                     # a final line lacking '\n' is not lexed -- presumably callers
                     # always supply a trailing newline; confirm.
                     for match in line_re.finditer(text):
                         line = match.group()
                         mode, code, insertion = self.get_modecode(line)

                         if mode != self.mode:
                             # Yield buffered tokens before transitioning to new mode.
                             for token in self.buffered_tokens():
                                 yield token
                             self.mode = mode

                         if insertion:
                             self.insertions.append((len(self.buffer), [insertion]))
                         self.buffer += code

                     # Flush whatever is still buffered once all lines are consumed.
                     for token in self.buffered_tokens():
                         yield token
             class IPyLexer(Lexer):
                 r"""
                 Primary lexer for all IPython-like code.

                 This is a simple helper lexer.  If the text, after stripping
                 surrounding whitespace, begins with "In \[[0-9]+\]:", then the entire
                 text is parsed with an IPython console lexer. If not, then the entire
                 text is parsed with an IPython lexer.

                 The `python3` option selects the Python 3 flavour for both cases.

                 The goal is to reduce the number of lexers that are registered
                 with Pygments.

                 """
                 name = 'IPy session'
                 aliases = ['ipy']

                 def __init__(self, **options):
                     """Create the two delegate lexers, forwarding all `options`."""
                     self.python3 = get_bool_opt(options, 'python3', False)
                     Lexer.__init__(self, **options)

                     # Honour `python3` for plain code too.  The console lexer reads
                     # the option from `options` on its own.
                     pylexer = IPython3Lexer if self.python3 else IPythonLexer
                     self.IPythonLexer = pylexer(**options)
                     self.IPythonConsoleLexer = IPythonConsoleLexer(**options)

                 def get_tokens_unprocessed(self, text):
                     """Delegate to the console lexer or the plain IPython lexer."""
                     # An input prompt at the start of the text marks a console session.
                     if re.match(r'(In \[[0-9]+\]:)', text.strip()):
                         lex = self.IPythonConsoleLexer
                     else:
                         lex = self.IPythonLexer
                     for token in lex.get_tokens_unprocessed(text):
                         yield token