highlight.py
75 lines
| 2.6 KiB
| text/x-python
|
PythonLexer
Martin Geisler
|
r8251 | # highlight.py - highlight extension implementation file | ||
# | ||||
# Copyright 2007-2009 Adam Hupp <adam@hupp.org> and others | ||||
# | ||||
# This software may be used and distributed according to the terms of the | ||||
Matt Mackall
|
r10263 | # GNU General Public License version 2 or any later version. | ||
Patrick Mezard
|
r6938 | # | ||
# The original module was split in an interface and an implementation | ||||
# file to defer pygments loading and speedup extension setup. | ||||
from mercurial import demandimport | ||||
Benoit Boissinot
|
r10394 | demandimport.ignore.extend(['pkgutil', 'pkg_resources', '__main__']) | ||
Matt Mackall
|
r7948 | from mercurial import util, encoding | ||
Patrick Mezard
|
r6938 | |||
from pygments import highlight | ||||
from pygments.util import ClassNotFound | ||||
from pygments.lexers import guess_lexer, guess_lexer_for_filename, TextLexer | ||||
from pygments.formatters import HtmlFormatter | ||||
SYNTAX_CSS = ('\n<link rel="stylesheet" href="{url}highlightcss" ' | ||||
'type="text/css" />') | ||||
Gregory Szorc
|
r26680 | def pygmentize(field, fctx, style, tmpl, guessfilenameonly=False): | ||
Patrick Mezard
|
r6938 | |||
# append a <link ...> to the syntax highlighting css | ||||
Matt Mackall
|
r10959 | old_header = tmpl.load('header') | ||
Patrick Mezard
|
r6938 | if SYNTAX_CSS not in old_header: | ||
new_header = old_header + SYNTAX_CSS | ||||
tmpl.cache['header'] = new_header | ||||
text = fctx.data() | ||||
if util.binary(text): | ||||
return | ||||
Matt Mackall
|
r23613 | # str.splitlines() != unicode.splitlines() because "reasons" | ||
for c in "\x0c\x1c\x1d\x1e": | ||||
if c in text: | ||||
text = text.replace(c, '') | ||||
Yuya Nishihara
|
r9424 | # Pygments is best used with Unicode strings: | ||
# <http://pygments.org/docs/unicode/> | ||||
text = text.decode(encoding.encoding, 'replace') | ||||
Christian Ebert
|
r7120 | |||
Patrick Mezard
|
r6938 | # To get multi-line strings right, we can't format line-by-line | ||
try: | ||||
Alexander Plavin
|
r19169 | lexer = guess_lexer_for_filename(fctx.path(), text[:1024], | ||
stripnl=False) | ||||
Patrick Mezard
|
r6938 | except (ClassNotFound, ValueError): | ||
Gregory Szorc
|
r26680 | # guess_lexer will return a lexer if *any* lexer matches. There is | ||
# no way to specify a minimum match score. This can give a high rate of | ||||
# false positives on files with an unknown filename pattern. | ||||
if guessfilenameonly: | ||||
return | ||||
Patrick Mezard
|
r6938 | try: | ||
Alexander Plavin
|
r19169 | lexer = guess_lexer(text[:1024], stripnl=False) | ||
Patrick Mezard
|
r6938 | except (ClassNotFound, ValueError): | ||
r25899 | # Don't highlight unknown files | |||
return | ||||
# Don't highlight text files | ||||
if isinstance(lexer, TextLexer): | ||||
return | ||||
Patrick Mezard
|
r6938 | |||
r25867 | formatter = HtmlFormatter(nowrap=True, style=style) | |||
Patrick Mezard
|
r6938 | |||
colorized = highlight(text, lexer, formatter) | ||||
Yuya Nishihara
|
r9424 | coloriter = (s.encode(encoding.encoding, 'replace') | ||
for s in colorized.splitlines()) | ||||
Patrick Mezard
|
r6938 | |||
Dirkjan Ochtman
|
r8360 | tmpl.filters['colorize'] = lambda x: coloriter.next() | ||
Patrick Mezard
|
r6938 | |||
oldl = tmpl.cache[field] | ||||
newl = oldl.replace('line|escape', 'line|colorize') | ||||
tmpl.cache[field] = newl | ||||