rhodecode-enterprise-ce Files · rhodecode/public/js/mode/xquery/xquery.js

helpers: unicode/str add flag to control usage of chardet....

helpers: unicode/str add flag to control usage of chardet. - in case it's somehow installed we still want to control the behaviour via explicit flag.

marcink - - Load All Authors

File last commit:

r4105:10488616 default


                r4109:19a6ab7e

default

Download file

             xquery.js
        
                    448 lines
            
             | 15.4 KiB
            
                | application/javascript
            
             |
                JavascriptLexer
            
             / rhodecode / public / js / mode / xquery / xquery.js
          
                    History
                
                 |
                  Annotation
                 | Raw
                 |Copy content
                 |Copy permalink

      // CodeMirror, copyright (c) by Marijn Haverbeke and others

      // Distributed under an MIT license: https://codemirror.net/LICENSE

      (function(mod) {

        if (typeof exports == "object" && typeof module == "object") // CommonJS

          mod(require("../../lib/codemirror"));

        else if (typeof define == "function" && define.amd) // AMD

          define(["../../lib/codemirror"], mod);

        else // Plain browser env

          mod(CodeMirror);

      })(function(CodeMirror) {

      "use strict";

      CodeMirror.defineMode("xquery", function() {

        // Lookup table consulted by the tokenizer. It is produced once by the
        // immediately-invoked function below; every recognised token text is a
        // property whose value is a descriptor of the form {type: ..., style: ...}.
        var keywords = function(){
          // builds a descriptor for anything rendered with the "keyword" style
          function keywordEntry(kind) {
            return {type: kind, style: "keyword"};
          }

          // descriptors that are shared by every member of their category
          var operatorEntry = keywordEntry("operator");
          var atomEntry = {type: "atom", style: "atom"};
          var punctuationEntry = {type: "punctuation", style: null};
          var axisEntry = {type: "axis_specifier", style: "qualifier"};

          // the table handed back at the end, seeded with the only punctuation token
          var table = {
            ',': punctuationEntry
          };

          // registers every name of `names` under one and the same descriptor object
          function registerAll(names, entry) {
            names.forEach(function(name) { table[name] = entry; });
          }

          // 'basic' keywords: each one gets a descriptor of its own whose type is
          // the keyword itself, e.g. 'after' --> {type: "after", style: "keyword"}
          var basicKeywords = ['after', 'all', 'allowing', 'ancestor', 'ancestor-or-self', 'any', 'array', 'as',
          'ascending', 'at', 'attribute', 'base-uri', 'before', 'boundary-space', 'by', 'case', 'cast',
          'castable', 'catch', 'child', 'collation', 'comment', 'construction', 'contains', 'content',
          'context', 'copy', 'copy-namespaces', 'count', 'decimal-format', 'declare', 'default', 'delete',
          'descendant', 'descendant-or-self', 'descending', 'diacritics', 'different', 'distance',
          'document', 'document-node', 'element', 'else', 'empty', 'empty-sequence', 'encoding', 'end',
          'entire', 'every', 'exactly', 'except', 'external', 'first', 'following', 'following-sibling',
          'for', 'from', 'ftand', 'ftnot', 'ft-option', 'ftor', 'function', 'fuzzy', 'greatest', 'group',
          'if', 'import', 'in', 'inherit', 'insensitive', 'insert', 'instance', 'intersect', 'into',
          'invoke', 'is', 'item', 'language', 'last', 'lax', 'least', 'let', 'levels', 'lowercase', 'map',
          'modify', 'module', 'most', 'namespace', 'next', 'no', 'node', 'nodes', 'no-inherit',
          'no-preserve', 'not', 'occurs', 'of', 'only', 'option', 'order', 'ordered', 'ordering',
          'paragraph', 'paragraphs', 'parent', 'phrase', 'preceding', 'preceding-sibling', 'preserve',
          'previous', 'processing-instruction', 'relationship', 'rename', 'replace', 'return',
          'revalidation', 'same', 'satisfies', 'schema', 'schema-attribute', 'schema-element', 'score',
          'self', 'sensitive', 'sentence', 'sentences', 'sequence', 'skip', 'sliding', 'some', 'stable',
          'start', 'stemming', 'stop', 'strict', 'strip', 'switch', 'text', 'then', 'thesaurus', 'times',
          'to', 'transform', 'treat', 'try', 'tumbling', 'type', 'typeswitch', 'union', 'unordered',
          'update', 'updating', 'uppercase', 'using', 'validate', 'value', 'variable', 'version',
          'weight', 'when', 'where', 'wildcards', 'window', 'with', 'without', 'word', 'words', 'xquery'];
          basicKeywords.forEach(function(word) { table[word] = keywordEntry(word); });

          // schema type names: all of them share {type: "atom", style: "atom"}
          registerAll(['xs:anyAtomicType', 'xs:anySimpleType', 'xs:anyType', 'xs:anyURI',
          'xs:base64Binary', 'xs:boolean', 'xs:byte', 'xs:date', 'xs:dateTime', 'xs:dateTimeStamp',
          'xs:dayTimeDuration', 'xs:decimal', 'xs:double', 'xs:duration', 'xs:ENTITIES', 'xs:ENTITY',
          'xs:float', 'xs:gDay', 'xs:gMonth', 'xs:gMonthDay', 'xs:gYear', 'xs:gYearMonth', 'xs:hexBinary',
          'xs:ID', 'xs:IDREF', 'xs:IDREFS', 'xs:int', 'xs:integer', 'xs:item', 'xs:java', 'xs:language',
          'xs:long', 'xs:Name', 'xs:NCName', 'xs:negativeInteger', 'xs:NMTOKEN', 'xs:NMTOKENS',
          'xs:nonNegativeInteger', 'xs:nonPositiveInteger', 'xs:normalizedString', 'xs:NOTATION',
          'xs:numeric', 'xs:positiveInteger', 'xs:precisionDecimal', 'xs:QName', 'xs:short', 'xs:string',
          'xs:time', 'xs:token', 'xs:unsignedByte', 'xs:unsignedInt', 'xs:unsignedLong',
          'xs:unsignedShort', 'xs:untyped', 'xs:untypedAtomic', 'xs:yearMonthDuration'], atomEntry);

          // operators: all of them share {type: "operator", style: "keyword"}
          registerAll(['eq', 'ne', 'lt', 'le', 'gt', 'ge', ':=', '=', '>', '>=', '<', '<=', '.', '|', '?', 'and', 'or', 'div', 'idiv', 'mod', '*', '/', '+', '-'], operatorEntry);

          // axis specifiers: all of them share {type: "axis_specifier", style: "qualifier"}
          registerAll(["self::", "attribute::", "child::", "descendant::", "descendant-or-self::", "parent::",
          "ancestor::", "ancestor-or-self::", "following::", "preceding::", "following-sibling::", "preceding-sibling::"], axisEntry);

          return table;
        }();

        // Makes `f` the active tokenizer on the state and runs it straight away
        // on the current stream position, handing back the style it produces.
        function chain(stream, state, f) {
          var nextTokenizer = f;
          state.tokenize = nextTokenizer;
          var style = nextTokenizer(stream, state);
          return style;
        }

        /**
         * The primary mode tokenizer.
         *
         * Consumes one token starting at the current stream position and returns
         * its style (null means "no style"). For constructs that need their own
         * scanning rules (XML tags and comments, CDATA, processing instructions,
         * XQuery comments, strings, variables) it switches state.tokenize to the
         * matching sub-tokenizer. Brackets, code blocks and constructors are
         * tracked on state.stack through pushStateStack/popStateStack.
         *
         * @param stream the CodeMirror string stream for the current line
         * @param state  the mode state ({tokenize, stack, ...})
         * @returns the style of the consumed token, or null
         */
        function tokenBase(stream, state) {
          var ch = stream.next(),
              mightBeFunction = false,
              // evaluated right after the first character was consumed because
              // isEQNameAhead() looks at stream.current()
              isEQName = isEQNameAhead(stream);

          // an XML tag (if not in some sub, chained tokenizer)
          if (ch == "<") {
            if(stream.match("!--", true))
              return chain(stream, state, tokenXMLComment);

            // only peek: the "<" alone is returned as the tag token and
            // tokenCDATA scans the rest from the next call on
            if(stream.match("![CDATA", false)) {
              state.tokenize = tokenCDATA;
              return "tag";
            }

            if(stream.match("?", false)) {
              return chain(stream, state, tokenPreProcessing);
            }

            var isclose = stream.eat("/");
            stream.eatSpace();
            var tagName = "", c;
            while ((c = stream.eat(/[^\s\u00a0=<>\"\'\/?]/))) tagName += c;

            return chain(stream, state, tokenTag(tagName, isclose));
          }
          // start code block
          else if(ch == "{") {
            pushStateStack(state, { type: "codeblock"});
            return null;
          }
          // end code block
          else if(ch == "}") {
            popStateStack(state);
            return null;
          }
          // if we're in an XML block
          else if(isInXmlBlock(state)) {
            if(ch == ">")
              return "tag";
            else if(ch == "/" && stream.eat(">")) {
              popStateStack(state);
              return "tag";
            }
            else
              return "variable";
          }
          // if a number
          else if (/\d/.test(ch)) {
            // the first digit is already consumed; take the remaining digits, an
            // optional fraction and an optional exponent. XQuery allows both "e"
            // and "E" as the exponent marker.
            stream.match(/^\d*(?:\.\d*)?(?:[eE][+\-]?\d+)?/);
            return "atom";
          }
          // comment start
          else if (ch === "(" && stream.eat(":")) {
            pushStateStack(state, { type: "comment"});
            return chain(stream, state, tokenComment);
          }
          // quoted string
          else if (!isEQName && (ch === '"' || ch === "'"))
            return chain(stream, state, tokenString(ch));
          // variable
          else if(ch === "$") {
            return chain(stream, state, tokenVariable);
          }
          // assignment
          else if(ch ===":" && stream.eat("=")) {
            return "keyword";
          }
          // open paren
          else if(ch === "(") {
            pushStateStack(state, { type: "paren"});
            return null;
          }
          // close paren
          else if(ch === ")") {
            popStateStack(state);
            return null;
          }
          // open bracket
          else if(ch === "[") {
            pushStateStack(state, { type: "bracket"});
            return null;
          }
          // close bracket
          else if(ch === "]") {
            popStateStack(state);
            return null;
          }
          else {
            var known = keywords.propertyIsEnumerable(ch) && keywords[ch];

            // if there's a EQName ahead, consume the rest of the string portion, it's likely a function
            // (isEQNameAhead only reports true when the closing quote is on this line,
            // so these loops always find it)
            if(isEQName && ch === '\"') while(stream.next() !== '"'){}
            if(isEQName && ch === '\'') while(stream.next() !== '\''){}

            // gobble up a word if the character is not known
            if(!known) stream.eatWhile(/[\w\$_-]/);

            // gobble a colon in the case that is a lib func type call fn:doc
            var foundColon = stream.eat(":");

            // if there's not a second colon, gobble another word. Otherwise, it's probably an axis specifier
            // which should get matched as a keyword
            if(!stream.eat(":") && foundColon) {
              stream.eatWhile(/[\w\$_-]/);
            }

            // if the next non whitespace character is an open paren, this is probably a function (if not a keyword of other sort)
            if(stream.match(/^[ \t]*\(/, false)) {
              mightBeFunction = true;
            }

            // is the word a keyword?
            var word = stream.current();
            known = keywords.propertyIsEnumerable(word) && keywords[word];

            // if we think it's a function call but not yet known,
            // set style to variable for now for lack of something better
            if(mightBeFunction && !known) known = {type: "function_call", style: "variable def"};

            // if the previous word was element, attribute, axis specifier, this word should be the name of that
            if(isInXmlConstructor(state)) {
              popStateStack(state);
              return "variable";
            }

            // as previously checked, if the word is element, attribute, axis specifier, call it an "xmlconstructor" and
            // push the stack so we know to look for it on the next word
            // (when the word is unknown, `known` is false and `known.type` is simply undefined)
            if(word == "element" || word == "attribute" || known.type == "axis_specifier") pushStateStack(state, {type: "xmlconstructor"});

            // if the word is known, return the details of that else just call this a generic 'word'
            return known ? known.style : "variable";
          }
        }

        /**
         * Tokenizer for XQuery comments "(: ... :)", which may nest.
         *
         * Runs after the opening "(:" has been consumed and keeps consuming until
         * the matching ":)" or the end of the line. When the outermost comment is
         * closed the "comment" stack entry is popped, which also restores the
         * previous tokenizer.
         *
         * The number of nested comments still open is kept in state.commentDepth
         * (a property created lazily here) rather than in a local, so that a
         * nested comment spanning several lines is still balanced correctly when
         * this function is called again for the next line.
         *
         * @returns always "comment"
         */
        function tokenComment(stream, state) {
          var maybeEnd = false, maybeNested = false, ch;
          var nestedCount = state.commentDepth || 0;

          while (ch = stream.next()) {
            if (ch == ")" && maybeEnd) {
              if(nestedCount > 0)
                nestedCount--;
              else {
                popStateStack(state);
                break;
              }
            }
            else if(ch == ":" && maybeNested) {
              nestedCount++;
              // this colon belongs to the "(:" just seen, so it must not also be
              // taken as the start of a closing ":)" (as in "(:)")
              maybeEnd = false;
              maybeNested = false;
              continue;
            }
            maybeEnd = (ch == ":");
            maybeNested = (ch == "(");
          }

          // remember how deep we are for the next line (0 once fully closed)
          state.commentDepth = nestedCount;
          return "comment";
        }

        // Builds the tokenizer for a string literal delimited by `quote`.
        // `f` is optional: when given, it becomes state.tokenize again once the
        // string has been closed.
        function tokenString(quote, f) {
          return function(stream, state) {
            // leaves the string: drop the top stack entry, then hand over to `f` if there is one
            function leaveString() {
              popStateStack(state);
              if (f) state.tokenize = f;
            }

            // true when a "{" is next and the top of the stack is an attribute.
            // NOTE(review): both call sites run after the "string" entry has been
            // pushed, and isInXmlAttributeBlock only inspects the top of the stack,
            // so this looks like it can never be true here -- confirm the intent.
            function atEmbeddedCode() {
              return stream.match("{", false) && isInXmlAttributeBlock(state);
            }

            // already inside this string and the token so far is just the quote:
            // that quote closes the string
            if (isInString(state) && stream.current() == quote) {
              leaveString();
              return "string";
            }

            pushStateStack(state, { type: "string", name: quote, tokenize: tokenString(quote, f) });

            // if we're in a string and in an XML block, allow an embedded code block
            if (atEmbeddedCode()) {
              state.tokenize = tokenBase;
              return "string";
            }

            // scan up to the closing quote or the end of the line
            for (var c = stream.next(); c; c = stream.next()) {
              if (c == quote) {
                leaveString();
                break;
              }
              // same embedded code block allowance, inside an attribute value
              if (atEmbeddedCode()) {
                state.tokenize = tokenBase;
                return "string";
              }
            }

            return "string";
          };
        }

        /**
         * Tokenizer for variable references; runs after the "$" was consumed.
         *
         * Accepts either `prefix:local` / `local` or a quoted EQName followed by
         * ":" and a local name. A ":" that is the start of ":=" is left in the
         * stream. Afterwards control always returns to tokenBase.
         *
         * @returns always "variable"
         */
        function tokenVariable(stream, state) {
          var isVariableChar = /[\w\$_-]/;

          // a variable may start with a quoted EQName so if the next character is quote, consume to the next quote
          if(stream.eat("\"")) {
            // stop at the end of the line when the closing quote is missing:
            // stream.next() keeps returning undefined there, so looping on the
            // quote alone would never terminate
            while(!stream.eol() && stream.next() !== '\"'){}
            stream.eat(":");
          } else {
            stream.eatWhile(isVariableChar);
            if(!stream.match(":=", false)) stream.eat(":");
          }
          stream.eatWhile(isVariableChar);
          state.tokenize = tokenBase;
          return "variable";
        }

        // Builds the tokenizer that finishes an XML tag once "<", an optional "/"
        // and the tag name have been read. `name` is the tag name and `isclose`
        // is truthy for a closing tag. The produced tokenizer always yields "tag".
        function tokenTag(name, isclose) {
          return function(stream, state) {
            stream.eatSpace();

            // "</name>": leave the element and go back to the base tokenizer
            var closedHere = isclose && stream.eat(">");
            if (closedHere) {
              popStateStack(state);
              state.tokenize = tokenBase;
              return "tag";
            }

            // unless it is a self closing tag without attributes, the element
            // is now open and gets its own stack entry
            var selfClosing = stream.eat("/");
            if (!selfClosing) {
              pushStateStack(state, { type: "tag", name: name, tokenize: tokenBase});
            }

            // ">" ends the tag; anything else has to be attributes
            state.tokenize = stream.eat(">") ? tokenBase : tokenAttribute;
            return "tag";
          };
        }

        // Tokenizer used inside an XML start tag after the tag name: handles the
        // end of the tag, "=", quoted attribute values and attribute names.
        function tokenAttribute(stream, state) {
          var first = stream.next();

          switch (first) {
            case "/":
              // "/>" closes the attribute (if one is open) and the element itself
              if (stream.eat(">")) {
                if (isInXmlAttributeBlock(state)) popStateStack(state);
                if (isInXmlBlock(state)) popStateStack(state);
                return "tag";
              }
              break;
            case ">":
              if (isInXmlAttributeBlock(state)) popStateStack(state);
              return "tag";
            case "=":
              return null;
            case '"':
            case "'":
              // quoted value; tokenString hands control back to this tokenizer
              return chain(stream, state, tokenString(first, tokenAttribute));
          }

          // anything else is (part of) an attribute name
          if (!isInXmlAttributeBlock(state)) {
            pushStateStack(state, { type: "attribute", tokenize: tokenAttribute});
          }
          stream.eat(/[a-zA-Z_:]/);
          stream.eatWhile(/[-a-zA-Z0-9_:.]/);
          stream.eatSpace();

          // the attribute has no value and the tag is being closed
          var tagEnds = stream.match(">", false) || stream.match("/", false);
          if (tagEnds) {
            popStateStack(state);
            state.tokenize = tokenBase;
          }

          return "attribute";
        }

        /**
         * Tokenizer for XML comments; runs after "<!--" has been consumed.
         *
         * Consumes up to and including the closing "-->" and then hands control
         * back to tokenBase. When the line ends first, the consumed text is still
         * styled as a comment and this tokenizer stays active for the next line.
         *
         * @returns always "comment"
         */
        function tokenXMLComment(stream, state) {
          var ch;
          while (ch = stream.next()) {
            if (ch == "-" && stream.match("->", true)) {
              state.tokenize = tokenBase;
              return "comment";
            }
          }
          // comment continues on the next line
          return "comment";
        }

        /**
         * Tokenizer for CDATA sections; installed by tokenBase once it has seen
         * "<![CDATA" (only the "<" is consumed at that point).
         *
         * Consumes up to and including the terminating "]]>" and then hands
         * control back to tokenBase. A "]]" that is not followed by ">" is
         * ordinary content. When the line ends first, the consumed text is still
         * styled and this tokenizer stays active for the next line.
         *
         * @returns always "comment"
         */
        function tokenCDATA(stream, state) {
          var ch;
          while (ch = stream.next()) {
            if (ch == "]" && stream.match("]>", true)) {
              state.tokenize = tokenBase;
              return "comment";
            }
          }
          // section continues on the next line
          return "comment";
        }

        /**
         * Tokenizer for processing instructions; runs after tokenBase has
         * consumed "<" with a "?" following.
         *
         * Consumes up to and including the closing "?>" and then hands control
         * back to tokenBase. When the line ends first, the consumed text is still
         * styled and this tokenizer stays active for the next line.
         *
         * @returns always "comment meta"
         */
        function tokenPreProcessing(stream, state) {
          var ch;
          while (ch = stream.next()) {
            if (ch == "?" && stream.match(">", true)) {
              state.tokenize = tokenBase;
              return "comment meta";
            }
          }
          // instruction continues on the next line
          return "comment meta";
        }

        // Context predicates: each one reports whether the entry on top of the
        // state stack has the given type (the answer comes straight from isIn).

        // inside an XML element
        function isInXmlBlock(state) {
          return isIn(state, "tag");
        }

        // inside the attribute list of an XML start tag
        function isInXmlAttributeBlock(state) {
          return isIn(state, "attribute");
        }

        // directly after `element`, `attribute` or an axis specifier
        function isInXmlConstructor(state) {
          return isIn(state, "xmlconstructor");
        }

        // inside a string literal
        function isInString(state) {
          return isIn(state, "string");
        }

        /**
         * Tells whether the quote that was just consumed starts a quoted EQName,
         * i.e. whether the text ahead is `...":` or `...':` with the closing quote
         * being the same kind as the opening one. Only peeks, never consumes.
         *
         * @param stream stream whose current token is exactly the opening quote
         * @returns a truthy match result when an EQName is ahead, else a falsy value
         */
        function isEQNameAhead(stream) {
          var opening = stream.current();

          if(opening === '"')
            return stream.match(/^[^\"]+\"\:/, false);

          // the name part must stop at the first single quote; excluding the
          // double quote here instead made a plain string such as 'a' look like an
          // EQName whenever some later ': followed on the same line
          if(opening === '\'')
            return stream.match(/^[^\']+\'\:/, false);

          return false;
        }

        // Reports whether the entry on top of the state stack is of `type`.
        // With an empty stack the (falsy) stack length itself is handed back.
        function isIn(state, type) {
          var depth = state.stack.length;
          return (depth && state.stack[depth - 1].type == type);
        }

        // Puts `newState` on top of the context stack kept in state.stack.
        function pushStateStack(state, newState) {
          var frames = state.stack;
          frames.push(newState);
        }

        // Drops the top entry of the context stack and re-installs the tokenizer
        // remembered by the entry that is on top afterwards; tokenBase is used
        // when the stack is empty or that entry carries no tokenizer.
        function popStateStack(state) {
          var frames = state.stack;
          frames.pop();
          var top = frames.length ? frames[frames.length - 1] : null;
          state.tokenize = (top && top.tokenize) || tokenBase;
        }

        // the interface for the mode API

        return {

          startState: function() {

            return {

              tokenize: tokenBase,

              cc: [],

              stack: []

            };

          },

          token: function(stream, state) {

            if (stream.eatSpace()) return null;

            var style = state.tokenize(stream, state);

            return style;

          },

          blockCommentStart: "(:",

          blockCommentEnd: ":)"

        };

      });

      CodeMirror.defineMIME("application/xquery", "xquery");

      });

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

				// CodeMirror, copyright (c) by Marijn Haverbeke and others
				// Distributed under an MIT license: https://codemirror.net/LICENSE

				(function(mod) {
				if (typeof exports == "object" && typeof module == "object") // CommonJS
				mod(require("../../lib/codemirror"));
				else if (typeof define == "function" && define.amd) // AMD
				define(["../../lib/codemirror"], mod);
				else // Plain browser env
				mod(CodeMirror);
				})(function(CodeMirror) {
				"use strict";

				CodeMirror.defineMode("xquery", function() {

				// Lookup table consulted by the tokenizer. It is produced once by the
				// immediately-invoked function below; every recognised token text is a
				// property whose value is a descriptor of the form {type: ..., style: ...}.
				var keywords = function(){
					// builds a descriptor for anything rendered with the "keyword" style
					function keywordEntry(kind) {
						return {type: kind, style: "keyword"};
					}

					// descriptors that are shared by every member of their category
					var operatorEntry = keywordEntry("operator");
					var atomEntry = {type: "atom", style: "atom"};
					var punctuationEntry = {type: "punctuation", style: null};
					var axisEntry = {type: "axis_specifier", style: "qualifier"};

					// the table handed back at the end, seeded with the only punctuation token
					var table = {
						',': punctuationEntry
					};

					// registers every name of `names` under one and the same descriptor object
					function registerAll(names, entry) {
						names.forEach(function(name) { table[name] = entry; });
					}

					// 'basic' keywords: each one gets a descriptor of its own whose type is
					// the keyword itself, e.g. 'after' --> {type: "after", style: "keyword"}
					var basicKeywords = ['after', 'all', 'allowing', 'ancestor', 'ancestor-or-self', 'any', 'array', 'as',
					'ascending', 'at', 'attribute', 'base-uri', 'before', 'boundary-space', 'by', 'case', 'cast',
					'castable', 'catch', 'child', 'collation', 'comment', 'construction', 'contains', 'content',
					'context', 'copy', 'copy-namespaces', 'count', 'decimal-format', 'declare', 'default', 'delete',
					'descendant', 'descendant-or-self', 'descending', 'diacritics', 'different', 'distance',
					'document', 'document-node', 'element', 'else', 'empty', 'empty-sequence', 'encoding', 'end',
					'entire', 'every', 'exactly', 'except', 'external', 'first', 'following', 'following-sibling',
					'for', 'from', 'ftand', 'ftnot', 'ft-option', 'ftor', 'function', 'fuzzy', 'greatest', 'group',
					'if', 'import', 'in', 'inherit', 'insensitive', 'insert', 'instance', 'intersect', 'into',
					'invoke', 'is', 'item', 'language', 'last', 'lax', 'least', 'let', 'levels', 'lowercase', 'map',
					'modify', 'module', 'most', 'namespace', 'next', 'no', 'node', 'nodes', 'no-inherit',
					'no-preserve', 'not', 'occurs', 'of', 'only', 'option', 'order', 'ordered', 'ordering',
					'paragraph', 'paragraphs', 'parent', 'phrase', 'preceding', 'preceding-sibling', 'preserve',
					'previous', 'processing-instruction', 'relationship', 'rename', 'replace', 'return',
					'revalidation', 'same', 'satisfies', 'schema', 'schema-attribute', 'schema-element', 'score',
					'self', 'sensitive', 'sentence', 'sentences', 'sequence', 'skip', 'sliding', 'some', 'stable',
					'start', 'stemming', 'stop', 'strict', 'strip', 'switch', 'text', 'then', 'thesaurus', 'times',
					'to', 'transform', 'treat', 'try', 'tumbling', 'type', 'typeswitch', 'union', 'unordered',
					'update', 'updating', 'uppercase', 'using', 'validate', 'value', 'variable', 'version',
					'weight', 'when', 'where', 'wildcards', 'window', 'with', 'without', 'word', 'words', 'xquery'];
					basicKeywords.forEach(function(word) { table[word] = keywordEntry(word); });

					// schema type names: all of them share {type: "atom", style: "atom"}
					registerAll(['xs:anyAtomicType', 'xs:anySimpleType', 'xs:anyType', 'xs:anyURI',
					'xs:base64Binary', 'xs:boolean', 'xs:byte', 'xs:date', 'xs:dateTime', 'xs:dateTimeStamp',
					'xs:dayTimeDuration', 'xs:decimal', 'xs:double', 'xs:duration', 'xs:ENTITIES', 'xs:ENTITY',
					'xs:float', 'xs:gDay', 'xs:gMonth', 'xs:gMonthDay', 'xs:gYear', 'xs:gYearMonth', 'xs:hexBinary',
					'xs:ID', 'xs:IDREF', 'xs:IDREFS', 'xs:int', 'xs:integer', 'xs:item', 'xs:java', 'xs:language',
					'xs:long', 'xs:Name', 'xs:NCName', 'xs:negativeInteger', 'xs:NMTOKEN', 'xs:NMTOKENS',
					'xs:nonNegativeInteger', 'xs:nonPositiveInteger', 'xs:normalizedString', 'xs:NOTATION',
					'xs:numeric', 'xs:positiveInteger', 'xs:precisionDecimal', 'xs:QName', 'xs:short', 'xs:string',
					'xs:time', 'xs:token', 'xs:unsignedByte', 'xs:unsignedInt', 'xs:unsignedLong',
					'xs:unsignedShort', 'xs:untyped', 'xs:untypedAtomic', 'xs:yearMonthDuration'], atomEntry);

					// operators: all of them share {type: "operator", style: "keyword"}
					registerAll(['eq', 'ne', 'lt', 'le', 'gt', 'ge', ':=', '=', '>', '>=', '<', '<=', '.', '|', '?', 'and', 'or', 'div', 'idiv', 'mod', '*', '/', '+', '-'], operatorEntry);

					// axis specifiers: all of them share {type: "axis_specifier", style: "qualifier"}
					registerAll(["self::", "attribute::", "child::", "descendant::", "descendant-or-self::", "parent::",
					"ancestor::", "ancestor-or-self::", "following::", "preceding::", "following-sibling::", "preceding-sibling::"], axisEntry);

					return table;
				}();

				// Makes `f` the active tokenizer on the state and runs it straight away
				// on the current stream position, handing back the style it produces.
				function chain(stream, state, f) {
					var nextTokenizer = f;
					state.tokenize = nextTokenizer;
					var style = nextTokenizer(stream, state);
					return style;
				}

				/**
				 * The primary mode tokenizer.
				 *
				 * Consumes one token starting at the current stream position and returns
				 * its style (null means "no style"). For constructs that need their own
				 * scanning rules (XML tags and comments, CDATA, processing instructions,
				 * XQuery comments, strings, variables) it switches state.tokenize to the
				 * matching sub-tokenizer. Brackets, code blocks and constructors are
				 * tracked on state.stack through pushStateStack/popStateStack.
				 *
				 * @param stream the CodeMirror string stream for the current line
				 * @param state  the mode state ({tokenize, stack, ...})
				 * @returns the style of the consumed token, or null
				 */
				function tokenBase(stream, state) {
					var ch = stream.next(),
							mightBeFunction = false,
							// evaluated right after the first character was consumed because
							// isEQNameAhead() looks at stream.current()
							isEQName = isEQNameAhead(stream);

					// an XML tag (if not in some sub, chained tokenizer)
					if (ch == "<") {
						if(stream.match("!--", true))
							return chain(stream, state, tokenXMLComment);

						// only peek: the "<" alone is returned as the tag token and
						// tokenCDATA scans the rest from the next call on
						if(stream.match("![CDATA", false)) {
							state.tokenize = tokenCDATA;
							return "tag";
						}

						if(stream.match("?", false)) {
							return chain(stream, state, tokenPreProcessing);
						}

						var isclose = stream.eat("/");
						stream.eatSpace();
						var tagName = "", c;
						while ((c = stream.eat(/[^\s\u00a0=<>\"\'\/?]/))) tagName += c;

						return chain(stream, state, tokenTag(tagName, isclose));
					}
					// start code block
					else if(ch == "{") {
						pushStateStack(state, { type: "codeblock"});
						return null;
					}
					// end code block
					else if(ch == "}") {
						popStateStack(state);
						return null;
					}
					// if we're in an XML block
					else if(isInXmlBlock(state)) {
						if(ch == ">")
							return "tag";
						else if(ch == "/" && stream.eat(">")) {
							popStateStack(state);
							return "tag";
						}
						else
							return "variable";
					}
					// if a number
					else if (/\d/.test(ch)) {
						// the first digit is already consumed; take the remaining digits, an
						// optional fraction and an optional exponent. XQuery allows both "e"
						// and "E" as the exponent marker.
						stream.match(/^\d*(?:\.\d*)?(?:[eE][+\-]?\d+)?/);
						return "atom";
					}
					// comment start
					else if (ch === "(" && stream.eat(":")) {
						pushStateStack(state, { type: "comment"});
						return chain(stream, state, tokenComment);
					}
					// quoted string
					else if (!isEQName && (ch === '"' || ch === "'"))
						return chain(stream, state, tokenString(ch));
					// variable
					else if(ch === "$") {
						return chain(stream, state, tokenVariable);
					}
					// assignment
					else if(ch ===":" && stream.eat("=")) {
						return "keyword";
					}
					// open paren
					else if(ch === "(") {
						pushStateStack(state, { type: "paren"});
						return null;
					}
					// close paren
					else if(ch === ")") {
						popStateStack(state);
						return null;
					}
					// open bracket
					else if(ch === "[") {
						pushStateStack(state, { type: "bracket"});
						return null;
					}
					// close bracket
					else if(ch === "]") {
						popStateStack(state);
						return null;
					}
					else {
						var known = keywords.propertyIsEnumerable(ch) && keywords[ch];

						// if there's a EQName ahead, consume the rest of the string portion, it's likely a function
						// (isEQNameAhead only reports true when the closing quote is on this line,
						// so these loops always find it)
						if(isEQName && ch === '\"') while(stream.next() !== '"'){}
						if(isEQName && ch === '\'') while(stream.next() !== '\''){}

						// gobble up a word if the character is not known
						if(!known) stream.eatWhile(/[\w\$_-]/);

						// gobble a colon in the case that is a lib func type call fn:doc
						var foundColon = stream.eat(":");

						// if there's not a second colon, gobble another word. Otherwise, it's probably an axis specifier
						// which should get matched as a keyword
						if(!stream.eat(":") && foundColon) {
							stream.eatWhile(/[\w\$_-]/);
						}
						// if the next non whitespace character is an open paren, this is probably a function (if not a keyword of other sort)
						if(stream.match(/^[ \t]*\(/, false)) {
							mightBeFunction = true;
						}
						// is the word a keyword?
						var word = stream.current();
						known = keywords.propertyIsEnumerable(word) && keywords[word];

						// if we think it's a function call but not yet known,
						// set style to variable for now for lack of something better
						if(mightBeFunction && !known) known = {type: "function_call", style: "variable def"};

						// if the previous word was element, attribute, axis specifier, this word should be the name of that
						if(isInXmlConstructor(state)) {
							popStateStack(state);
							return "variable";
						}
						// as previously checked, if the word is element, attribute, axis specifier, call it an "xmlconstructor" and
						// push the stack so we know to look for it on the next word
						// (when the word is unknown, `known` is false and `known.type` is simply undefined)
						if(word == "element" || word == "attribute" || known.type == "axis_specifier") pushStateStack(state, {type: "xmlconstructor"});

						// if the word is known, return the details of that else just call this a generic 'word'
						return known ? known.style : "variable";
					}
				}

				/**
				 * Tokenizer for XQuery comments "(: ... :)", which may nest.
				 *
				 * Runs after the opening "(:" has been consumed and keeps consuming until
				 * the matching ":)" or the end of the line. When the outermost comment is
				 * closed the "comment" stack entry is popped, which also restores the
				 * previous tokenizer.
				 *
				 * The number of nested comments still open is kept in state.commentDepth
				 * (a property created lazily here) rather than in a local, so that a
				 * nested comment spanning several lines is still balanced correctly when
				 * this function is called again for the next line.
				 *
				 * @returns always "comment"
				 */
				function tokenComment(stream, state) {
					var maybeEnd = false, maybeNested = false, ch;
					var nestedCount = state.commentDepth || 0;

					while (ch = stream.next()) {
						if (ch == ")" && maybeEnd) {
							if(nestedCount > 0)
								nestedCount--;
							else {
								popStateStack(state);
								break;
							}
						}
						else if(ch == ":" && maybeNested) {
							nestedCount++;
							// this colon belongs to the "(:" just seen, so it must not also be
							// taken as the start of a closing ":)" (as in "(:)")
							maybeEnd = false;
							maybeNested = false;
							continue;
						}
						maybeEnd = (ch == ":");
						maybeNested = (ch == "(");
					}

					// remember how deep we are for the next line (0 once fully closed)
					state.commentDepth = nestedCount;
					return "comment";
				}

				// Builds the tokenizer for a string literal delimited by `quote`.
				// `f` is optional: when given, it becomes state.tokenize again once the
				// string has been closed.
				function tokenString(quote, f) {
					return function(stream, state) {
						// leaves the string: drop the top stack entry, then hand over to `f` if there is one
						function leaveString() {
							popStateStack(state);
							if (f) state.tokenize = f;
						}

						// true when a "{" is next and the top of the stack is an attribute.
						// NOTE(review): both call sites run after the "string" entry has been
						// pushed, and isInXmlAttributeBlock only inspects the top of the stack,
						// so this looks like it can never be true here -- confirm the intent.
						function atEmbeddedCode() {
							return stream.match("{", false) && isInXmlAttributeBlock(state);
						}

						// already inside this string and the token so far is just the quote:
						// that quote closes the string
						if (isInString(state) && stream.current() == quote) {
							leaveString();
							return "string";
						}

						pushStateStack(state, { type: "string", name: quote, tokenize: tokenString(quote, f) });

						// if we're in a string and in an XML block, allow an embedded code block
						if (atEmbeddedCode()) {
							state.tokenize = tokenBase;
							return "string";
						}

						// scan up to the closing quote or the end of the line
						for (var c = stream.next(); c; c = stream.next()) {
							if (c == quote) {
								leaveString();
								break;
							}
							// same embedded code block allowance, inside an attribute value
							if (atEmbeddedCode()) {
								state.tokenize = tokenBase;
								return "string";
							}
						}

						return "string";
					};
				}

				/**
				 * Tokenizer for variable references; runs after the "$" was consumed.
				 *
				 * Accepts either `prefix:local` / `local` or a quoted EQName followed by
				 * ":" and a local name. A ":" that is the start of ":=" is left in the
				 * stream. Afterwards control always returns to tokenBase.
				 *
				 * @returns always "variable"
				 */
				function tokenVariable(stream, state) {
					var isVariableChar = /[\w\$_-]/;

					// a variable may start with a quoted EQName so if the next character is quote, consume to the next quote
					if(stream.eat("\"")) {
						// stop at the end of the line when the closing quote is missing:
						// stream.next() keeps returning undefined there, so looping on the
						// quote alone would never terminate
						while(!stream.eol() && stream.next() !== '\"'){}
						stream.eat(":");
					} else {
						stream.eatWhile(isVariableChar);
						if(!stream.match(":=", false)) stream.eat(":");
					}
					stream.eatWhile(isVariableChar);
					state.tokenize = tokenBase;
					return "variable";
				}

				// Builds the tokenizer that finishes an XML tag once "<", an optional "/"
				// and the tag name have been read. `name` is the tag name and `isclose`
				// is truthy for a closing tag. The produced tokenizer always yields "tag".
				function tokenTag(name, isclose) {
					return function(stream, state) {
						stream.eatSpace();

						// "</name>": leave the element and go back to the base tokenizer
						var closedHere = isclose && stream.eat(">");
						if (closedHere) {
							popStateStack(state);
							state.tokenize = tokenBase;
							return "tag";
						}

						// unless it is a self closing tag without attributes, the element
						// is now open and gets its own stack entry
						var selfClosing = stream.eat("/");
						if (!selfClosing) {
							pushStateStack(state, { type: "tag", name: name, tokenize: tokenBase});
						}

						// ">" ends the tag; anything else has to be attributes
						state.tokenize = stream.eat(">") ? tokenBase : tokenAttribute;
						return "tag";
					};
				}

				/**
				 * Tokenizer used inside an XML start tag after the tag name.
				 *
				 * Handles, in this order: "/>" (closes an open attribute entry and the
				 * element), ">" (closes an open attribute entry), "=", a quoted attribute
				 * value (delegated to tokenString, which hands control back here), and
				 * finally an attribute name.
				 *
				 * @returns "tag", "attribute", null for "=", or the style produced by
				 *          the string tokenizer
				 */
				function tokenAttribute(stream, state) {
					var ch = stream.next();

					if(ch == "/" && stream.eat(">")) {
						if(isInXmlAttributeBlock(state)) popStateStack(state);
						if(isInXmlBlock(state)) popStateStack(state);
						return "tag";
					}
					if(ch == ">") {
						if(isInXmlAttributeBlock(state)) popStateStack(state);
						return "tag";
					}
					if(ch == "=")
						return null;
					// quoted string
					if (ch == '"' || ch == "'")
						return chain(stream, state, tokenString(ch, tokenAttribute));

					// anything else is (part of) an attribute name; open an attribute
					// entry unless one is already on top of the stack
					if(!isInXmlAttributeBlock(state))
						pushStateStack(state, { type: "attribute", tokenize: tokenAttribute});

					stream.eat(/[a-zA-Z_:]/);
					stream.eatWhile(/[-a-zA-Z0-9_:.]/);
					stream.eatSpace();

					// the case where the attribute has no value and the tag was closed
					if(stream.match(">", false) || stream.match("/", false)) {
						popStateStack(state);
						state.tokenize = tokenBase;
					}

					return "attribute";
				}

				/**
				 * Tokenizer for XML comments; runs after "<!--" has been consumed.
				 *
				 * Consumes up to and including the closing "-->" and then hands control
				 * back to tokenBase. When the line ends first, the consumed text is still
				 * styled as a comment and this tokenizer stays active for the next line.
				 *
				 * @returns always "comment"
				 */
				function tokenXMLComment(stream, state) {
					var ch;
					while (ch = stream.next()) {
						if (ch == "-" && stream.match("->", true)) {
							state.tokenize = tokenBase;
							return "comment";
						}
					}
					// comment continues on the next line
					return "comment";
				}


				/**
				 * Tokenizer for CDATA sections; installed by tokenBase once it has seen
				 * "<![CDATA" (only the "<" is consumed at that point).
				 *
				 * Consumes up to and including the terminating "]]>" and then hands
				 * control back to tokenBase. A "]]" that is not followed by ">" is
				 * ordinary content. When the line ends first, the consumed text is still
				 * styled and this tokenizer stays active for the next line.
				 *
				 * @returns always "comment"
				 */
				function tokenCDATA(stream, state) {
					var ch;
					while (ch = stream.next()) {
						if (ch == "]" && stream.match("]>", true)) {
							state.tokenize = tokenBase;
							return "comment";
						}
					}
					// section continues on the next line
					return "comment";
				}

				/**
				 * Tokenizer for processing instructions; runs after tokenBase has
				 * consumed "<" with a "?" following.
				 *
				 * Consumes up to and including the closing "?>" and then hands control
				 * back to tokenBase. When the line ends first, the consumed text is still
				 * styled and this tokenizer stays active for the next line.
				 *
				 * @returns always "comment meta"
				 */
				function tokenPreProcessing(stream, state) {
					var ch;
					while (ch = stream.next()) {
						if (ch == "?" && stream.match(">", true)) {
							state.tokenize = tokenBase;
							return "comment meta";
						}
					}
					// instruction continues on the next line
					return "comment meta";
				}


				// Context predicates: each one reports whether the entry on top of the
				// state stack has the given type (the answer comes straight from isIn).

				// inside an XML element
				function isInXmlBlock(state) {
					return isIn(state, "tag");
				}

				// inside the attribute list of an XML start tag
				function isInXmlAttributeBlock(state) {
					return isIn(state, "attribute");
				}

				// directly after `element`, `attribute` or an axis specifier
				function isInXmlConstructor(state) {
					return isIn(state, "xmlconstructor");
				}

				// inside a string literal
				function isInString(state) {
					return isIn(state, "string");
				}

				/**
				 * Tells whether the quote that was just consumed starts a quoted EQName,
				 * i.e. whether the text ahead is `...":` or `...':` with the closing quote
				 * being the same kind as the opening one. Only peeks, never consumes.
				 *
				 * @param stream stream whose current token is exactly the opening quote
				 * @returns a truthy match result when an EQName is ahead, else a falsy value
				 */
				function isEQNameAhead(stream) {
					var opening = stream.current();

					if(opening === '"')
						return stream.match(/^[^\"]+\"\:/, false);

					// the name part must stop at the first single quote; excluding the
					// double quote here instead made a plain string such as 'a' look like an
					// EQName whenever some later ': followed on the same line
					if(opening === '\'')
						return stream.match(/^[^\']+\'\:/, false);

					return false;
				}

				// Reports whether the entry on top of the state stack is of `type`.
				// With an empty stack the (falsy) stack length itself is handed back.
				function isIn(state, type) {
					var depth = state.stack.length;
					return (depth && state.stack[depth - 1].type == type);
				}

				// Puts `newState` on top of the context stack kept in state.stack.
				function pushStateStack(state, newState) {
					var frames = state.stack;
					frames.push(newState);
				}

				/**
				 * Drops the top entry of the context stack and re-installs the tokenizer
				 * remembered by the entry that is on top afterwards. tokenBase is used
				 * when the stack is empty or that entry carries no tokenizer.
				 */
				function popStateStack(state) {
					state.stack.pop();
					var reinstateTokenize = state.stack.length && state.stack[state.stack.length-1].tokenize;
					state.tokenize = reinstateTokenize || tokenBase;
				}

				// the interface for the mode API
				return {
				startState: function() {
				return {
				tokenize: tokenBase,
				cc: [],
				stack: []
				};
				},

				token: function(stream, state) {
				if (stream.eatSpace()) return null;
				var style = state.tokenize(stream, state);
				return style;
				},

				blockCommentStart: "(:",
				blockCommentEnd: ":)"

				};

				});

				CodeMirror.defineMIME("application/xquery", "xquery");

				});