python.js
324 lines
| 10.6 KiB
| application/javascript
|
JavascriptLexer
Fernando Perez
|
r4933 | CodeMirror.defineMode("python", function(conf, parserConf) { | ||
Brian E. Granger
|
r4504 | var ERRORCLASS = 'error'; | ||
Fernando Perez
|
r4934 | |||
Brian E. Granger
|
// Build a regular expression that matches any one of `words` at the start
// of the input, followed by a word boundary. Each word is inserted verbatim
// (it is treated as regular-expression source) inside its own capture group.
function wordRegexp(words) {
    var alternatives = "(" + words.join(")|(") + ")";
    return new RegExp("^(" + alternatives + ")\\b");
}
Fernando Perez
|
r4934 | |||
Fernando Perez
|
// --- Operators -------------------------------------------------------------
// IPython-specific change: '?' is recognized as an operator character in
// addition to the usual set (+ - * / % & | ^ ~ < > !).
var singleOperators = new RegExp("^[\\+\\-\\*/%&|\\^~<>!\\?]");
var doubleOperators = new RegExp("^((==)|(!=)|(<=)|(>=)|(<>)|(<<)|(>>)|(//)|(\\*\\*))");
var wordOperators = wordRegexp(['and', 'or', 'not', 'is', 'in']);

// --- Delimiters ------------------------------------------------------------
var singleDelimiters = new RegExp('^[\\(\\)\\[\\]\\{\\}@,:`=;\\.]');
var doubleDelimiters = new RegExp("^((\\+=)|(\\-=)|(\\*=)|(%=)|(/=)|(&=)|(\\|=)|(\\^=))");
var tripleDelimiters = new RegExp("^((//=)|(>>=)|(<<=)|(\\*\\*=))");

// --- Names -----------------------------------------------------------------
var identifiers = new RegExp("^[_A-Za-z][_A-Za-z0-9]*");

// Keywords and builtin type names that are used regardless of the Python
// version being highlighted.
var commonkeywords = [
    'as', 'assert', 'break', 'class', 'continue',
    'def', 'del', 'elif', 'else', 'except', 'finally',
    'for', 'from', 'global', 'if', 'import',
    'lambda', 'pass', 'raise', 'return',
    'try', 'while', 'with', 'yield'
];
var commontypes = [
    'bool', 'classmethod', 'complex', 'dict', 'enumerate',
    'float', 'frozenset', 'int', 'list', 'object',
    'property', 'reversed', 'set', 'slice', 'staticmethod',
    'str', 'super', 'tuple', 'type'
];

// Additional vocabulary for each supported Python major version.
var py2 = {
    types: ['basestring', 'buffer', 'file', 'long', 'unicode', 'xrange'],
    keywords: ['exec', 'print']
};
var py3 = {
    types: ['bytearray', 'bytes', 'filter', 'map', 'memoryview',
            'open', 'range', 'zip'],
    keywords: ['nonlocal']
};
Fernando Perez
|
// Pick the version-specific vocabulary: Python 3 only when the configured
// version parses to exactly 3, Python 2 otherwise (including when no version
// is configured).
var isPython3 = !!parserConf.version && parseInt(parserConf.version, 10) === 3;
var dialect = isPython3 ? py3 : py2;
commonkeywords = commonkeywords.concat(dialect.keywords);
commontypes = commontypes.concat(dialect.types);

// Opening of a string literal: an optional case-insensitive prefix followed
// by a triple or single quote. The Python 3 pattern accepts r, b and br; the
// Python 2 pattern additionally accepts u and ur.
var stringPrefixes = isPython3
    ? new RegExp("^(([rb]|(br))?('{3}|\"{3}|['\"]))", "i")
    : new RegExp("^(([rub]|(ur)|(br))?('{3}|\"{3}|['\"]))", "i");

var keywords = wordRegexp(commonkeywords);
var types = wordRegexp(commontypes);

// Scratch flag shared between the tokenizers; holds 'indent', 'dedent' or null.
var indentInfo = null;
// tokenizers | ||||
// Default tokenizer: consumes one token from `stream` and returns its style
// ('comment', 'number', 'string', 'operator', 'builtin', 'keyword',
// 'variable', the error class, or null for whitespace and delimiters).
//
// At the start of a line it also compares the line's indentation with the
// innermost scope's offset and records the result in `indentInfo`
// ('indent' / 'dedent'); an unindented line while inside a scope triggers
// dedent() directly.
function tokenBase(stream, state) {
    // Handle scope changes
    if (stream.sol()) {
        var scopeOffset = state.scopes[0].offset;
        if (stream.eatSpace()) {
            var lineOffset = stream.indentation();
            if (lineOffset > scopeOffset) {
                indentInfo = 'indent';
            } else if (lineOffset < scopeOffset) {
                indentInfo = 'dedent';
            }
            return null;
        } else {
            if (scopeOffset > 0) {
                dedent(stream, state);
            }
        }
    }
    if (stream.eatSpace()) {
        return null;
    }

    var ch = stream.peek();

    // Handle Comments
    if (ch === '#') {
        stream.skipToEnd();
        return 'comment';
    }

    // Handle Number Literals
    if (stream.match(/^[0-9\.]/, false)) {
        var floatLiteral = false;
        // Floats. Exponents are matched case-insensitively in every form
        // that allows one, so `1.5E3` and `1.e3` are each a single token.
        if (stream.match(/^\d*\.\d+(e[\+\-]?\d+)?/i)) { floatLiteral = true; }
        if (stream.match(/^\d+\.\d*(e[\+\-]?\d+)?/i)) { floatLiteral = true; }
        if (stream.match(/^\.\d+/)) { floatLiteral = true; }
        if (floatLiteral) {
            // Float literals may be "imaginary"
            stream.eat(/J/i);
            return 'number';
        }
        // Integers
        var intLiteral = false;
        // Hex
        if (stream.match(/^0x[0-9a-f]+/i)) { intLiteral = true; }
        // Binary
        if (stream.match(/^0b[01]+/i)) { intLiteral = true; }
        // Octal
        if (stream.match(/^0o[0-7]+/i)) { intLiteral = true; }
        // Decimal. The `i` flag lets an upper-case exponent (`1E5`) be
        // consumed as part of the literal instead of being split off as an
        // identifier.
        if (stream.match(/^[1-9]\d*(e[\+\-]?\d+)?/i)) {
            // Decimal literals may be "imaginary"
            stream.eat(/J/i);
            // TODO - Can you have imaginary longs?
            intLiteral = true;
        }
        // Zero by itself with no other piece of number.
        if (stream.match(/^0(?![\dx])/i)) { intLiteral = true; }
        if (intLiteral) {
            // Integer literals may be "long"
            stream.eat(/L/i);
            return 'number';
        }
        // A lone '.' reaches this point and is handled as a delimiter below.
    }

    // Handle Strings: hand over to a tokenizer bound to the matched opening
    // (prefix + quotes) and let it consume the rest of the literal.
    if (stream.match(stringPrefixes)) {
        state.tokenize = tokenStringFactory(stream.current());
        return state.tokenize(stream, state);
    }

    // Handle operators and Delimiters. Longer forms are tried first so that
    // e.g. '**=' is not split into '**' and '='.
    if (stream.match(tripleDelimiters) || stream.match(doubleDelimiters)) {
        return null;
    }
    if (stream.match(doubleOperators)
        || stream.match(singleOperators)
        || stream.match(wordOperators)) {
        return 'operator';
    }
    if (stream.match(singleDelimiters)) {
        return null;
    }

    if (stream.match(types)) {
        return 'builtin';
    }

    if (stream.match(keywords)) {
        return 'keyword';
    }

    if (stream.match(identifiers)) {
        return 'variable';
    }

    // Handle non-detected items: consume one character so the stream always
    // advances, and flag it.
    stream.next();
    return ERRORCLASS;
}
Fernando Perez
|
r4934 | |||
Brian E. Granger
|
// Create a tokenizer for the body of a string literal.
//
// `delimiter` is the opening of the literal as matched by the caller: any
// run of r/u/b prefix letters (either case) followed by the quote(s). The
// prefix is stripped; a remaining delimiter of length 1 marks a single-line
// string, anything else is treated as a multi-line string.
//
// The returned function (stream, state) consumes string content up to the
// end of the line or the closing delimiter and returns the style for it.
function tokenStringFactory(delimiter) {
    // Count prefix letters with an explicit bound. Without the bound an
    // empty or prefix-only delimiter would never terminate, because
    // ''.charAt(0) is '' and 'rub'.indexOf('') is 0.
    var prefixLength = 0;
    while (prefixLength < delimiter.length
           && 'rub'.indexOf(delimiter.charAt(prefixLength).toLowerCase()) >= 0) {
        prefixLength += 1;
    }
    delimiter = delimiter.slice(prefixLength);
    var singleline = delimiter.length === 1;
    var OUTCLASS = 'string';

    return function tokenString(stream, state) {
        while (!stream.eol()) {
            stream.eatWhile(/[^'"\\]/);
            if (stream.eat('\\')) {
                // Skip the escaped character. A backslash at the very end
                // of a single-line string continues it on the next line, so
                // the tokenizer is deliberately left in place.
                stream.next();
                if (singleline && stream.eol()) {
                    return OUTCLASS;
                }
            } else if (stream.match(delimiter)) {
                // Closing delimiter: hand control back to the base tokenizer.
                state.tokenize = tokenBase;
                return OUTCLASS;
            } else {
                // A quote character that is not the closing delimiter.
                stream.eat(/['"]/);
            }
        }
        // End of line reached without a closing delimiter.
        if (singleline) {
            if (parserConf.singleLineStringErrors) {
                return ERRORCLASS;
            } else {
                state.tokenize = tokenBase;
            }
        }
        return OUTCLASS;
    };
}
Fernando Perez
|
r4934 | |||
Brian E. Granger
|
// Push a new scope onto the front of state.scopes.
//
// With no `type` (or 'py') the new scope's offset is one configured indent
// unit deeper than the nearest enclosing 'py' scope, or 0 if there is none.
// For any other type the offset is the stream column plus the length of the
// current token.
function indent(stream, state, type) {
    var scopeType = type || 'py';
    var offset;

    if (scopeType !== 'py') {
        offset = stream.column() + stream.current().length;
    } else {
        offset = 0;
        var idx = 0;
        while (idx < state.scopes.length) {
            var scope = state.scopes[idx];
            if (scope.type === 'py') {
                offset = scope.offset + conf.indentUnit;
                break;
            }
            idx += 1;
        }
    }

    state.scopes.unshift({offset: offset, type: scopeType});
}
Fernando Perez
|
r4934 | |||
Brian E. Granger
|
// Pop scopes off the front of state.scopes.
//
// Returns undefined when only one scope is left (nothing is popped), true
// when the innermost scope is a 'py' scope and no scope's offset equals the
// line's indentation (nothing is popped), and false after a successful pop.
// For a 'py' scope, scopes are popped until the innermost offset equals the
// line's indentation; for any other scope type exactly one scope is popped.
function dedent(stream, state) {
    var scopes = state.scopes;
    if (scopes.length == 1) {
        return;
    }

    if (scopes[0].type !== 'py') {
        scopes.shift();
        return false;
    }

    var target = stream.indentation();
    var hasMatchingScope = scopes.some(function (scope) {
        return scope.offset === target;
    });
    if (!hasMatchingScope) {
        return true;
    }

    while (scopes[0].offset !== target) {
        scopes.shift();
    }
    return false;
}
// Run the active tokenizer for one token and apply the indentation
// bookkeeping that depends on the token just read. Returns the token style.
//
// Besides forwarding the style this function:
//   - merges '.' + identifier and '@' + identifier into a single token,
//   - opens a scope after a block-introducing ':' or an opening bracket,
//   - closes scopes on a closing bracket, on a dedented line, and at the
//     end of a line containing 'pass' or 'return'.
function tokenLexer(stream, state) {
    indentInfo = null;
    // The lambda flag only applies to the line it was seen on; clear it
    // before the first token of every line so it can never leak forward,
    // whichever return path the previous line ended on.
    if (stream.sol()) {
        state.lambda = false;
    }
    var style = state.tokenize(stream, state);
    var current = stream.current();

    // Handle '.' connected identifiers
    if (current === '.') {
        style = state.tokenize(stream, state);
        current = stream.current();
        if (style === 'variable') {
            return 'variable';
        } else {
            return ERRORCLASS;
        }
    }

    // Handle decorators
    if (current === '@') {
        style = state.tokenize(stream, state);
        current = stream.current();
        if (style === 'variable'
            || current === '@staticmethod'
            || current === '@classmethod') {
            return 'meta';
        } else {
            return ERRORCLASS;
        }
    }

    // Handle scope changes.
    if (current === 'pass' || current === 'return') {
        state.dedent += 1;
    }
    // The ':' that ends a lambda's parameter list does not start a block,
    // so remember that a lambda keyword was seen and skip the indent below.
    if (style === 'keyword' && current === 'lambda') {
        state.lambda = true;
    }
    if ((current === ':' && !state.lambda && state.scopes[0].type == 'py')
        || indentInfo === 'indent') {
        indent(stream, state);
    }
    var delimiter_index = '[({'.indexOf(current);
    if (delimiter_index !== -1) {
        // Open a bracket scope typed by the matching closing character.
        indent(stream, state, '])}'.slice(delimiter_index, delimiter_index+1));
    }
    if (indentInfo === 'dedent') {
        if (dedent(stream, state)) {
            return ERRORCLASS;
        }
    }
    delimiter_index = '])}'.indexOf(current);
    if (delimiter_index !== -1) {
        if (dedent(stream, state)) {
            return ERRORCLASS;
        }
    }
    // 'pass' / 'return' close the current block once the line is finished.
    if (state.dedent > 0 && stream.eol() && state.scopes[0].type == 'py') {
        if (state.scopes.length > 1) state.scopes.shift();
        state.dedent -= 1;
    }

    return style;
}
// The mode object handed back to CodeMirror.
var external = {
    // Initial parser state: base tokenizer, a single 'py' scope at
    // `basecolumn` (0 when not given), and cleared bookkeeping fields.
    startState: function(basecolumn) {
        return {
            tokenize: tokenBase,
            scopes: [{offset:basecolumn || 0, type:'py'}],
            lastToken: null,
            lambda: false,
            dedent: 0
        };
    },

    // Read one token, record it in state.lastToken and return its style.
    token: function(stream, state) {
        var style = tokenLexer(stream, state);

        state.lastToken = {style:style, content: stream.current()};

        // The lambda flag lives on the parser state, not on the stream;
        // clear it once the line is finished.
        if (stream.eol() && state.lambda) {
            state.lambda = false;
        }

        return style;
    },

    // Indentation for a new line: the innermost scope's offset, or 0 while
    // a non-base tokenizer (e.g. inside a string) is active.
    indent: function(state, textAfter) {
        if (state.tokenize != tokenBase) {
            return 0;
        }

        return state.scopes[0].offset;
    }

};
return external; | ||||
}); | ||||
CodeMirror.defineMIME("text/x-python", "python"); | ||||