manifest: skip fastdelta if the change is large

In large repos, the existing manifest fastdelta computation (which performs a bisect on the raw manifest for every file that is changing) is excessively slow. This patch makes fastdelta fall back to the normal string delta algorithm when the number of changes is large. On a large repo, with a commit touching 8000 files, this reduces the commit time by 7 seconds (fastdelta goes from 8 seconds to 1). I tested this change by modifying the function to compare the old and the new values and running the test suite. The only difference is that the pure text-diff algorithm sometimes produces smaller (but functionally identical) deltatexts than the bisect algorithm.
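The fallback described above amounts to a size check before choosing a delta strategy. Below is a minimal sketch of that idea; the function name, the callables, and the cutoff value are hypothetical, not the actual mercurial/manifest.py code.

# Illustrative sketch only: names and the cutoff are assumptions, not the
# real Mercurial implementation of this change.
MAX_FASTDELTA_CHANGES = 1000  # hypothetical cutoff

def choose_manifest_delta(old_text, new_text, changes, fastdelta, textdiff):
    """Pick a delta strategy based on how many files changed.

    fastdelta -- callable that bisects into old_text once per changed file
    textdiff  -- callable that computes a plain string delta of both texts
    """
    if len(changes) < MAX_FASTDELTA_CHANGES:
        # few changes: per-file bisect is cheap and yields a tight delta
        return fastdelta(old_text, changes)
    # many changes: one whole-text diff beats thousands of bisects
    return textdiff(old_text, new_text)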

highlight.py | 75 lines | 2.6 KiB | text/x-python
# highlight.py - highlight extension implementation file
#
# Copyright 2007-2009 Adam Hupp <adam@hupp.org> and others
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.
#
# The original module was split in an interface and an implementation
# file to defer pygments loading and speedup extension setup.
from mercurial import demandimport
demandimport.ignore.extend(['pkgutil', 'pkg_resources', '__main__'])
from mercurial import util, encoding

from pygments import highlight
from pygments.util import ClassNotFound
from pygments.lexers import guess_lexer, guess_lexer_for_filename, TextLexer
from pygments.formatters import HtmlFormatter

SYNTAX_CSS = ('\n<link rel="stylesheet" href="{url}highlightcss" '
              'type="text/css" />')
def pygmentize(field, fctx, style, tmpl, guessfilenameonly=False):

    # append a <link ...> to the syntax highlighting css
    old_header = tmpl.load('header')
    if SYNTAX_CSS not in old_header:
        new_header = old_header + SYNTAX_CSS
        tmpl.cache['header'] = new_header

    text = fctx.data()
    if util.binary(text):
        return

    # str.splitlines() != unicode.splitlines(): these control characters are
    # line breaks for unicode but not for str, so strip them to keep the
    # colorized output's line count in sync with the template's line iteration
    for c in "\x0c\x1c\x1d\x1e":
        if c in text:
            text = text.replace(c, '')

    # Pygments is best used with Unicode strings:
    # <http://pygments.org/docs/unicode/>
    text = text.decode(encoding.encoding, 'replace')

    # To get multi-line strings right, we can't format line-by-line
    try:
        lexer = guess_lexer_for_filename(fctx.path(), text[:1024],
                                         stripnl=False)
    except (ClassNotFound, ValueError):
        # guess_lexer will return a lexer if *any* lexer matches. There is
        # no way to specify a minimum match score. This can give a high rate
        # of false positives on files with an unknown filename pattern.
        if guessfilenameonly:
            return

        try:
            lexer = guess_lexer(text[:1024], stripnl=False)
        except (ClassNotFound, ValueError):
            # Don't highlight unknown files
            return

    # Don't highlight text files
    if isinstance(lexer, TextLexer):
        return

    formatter = HtmlFormatter(nowrap=True, style=style)

    colorized = highlight(text, lexer, formatter)
    coloriter = (s.encode(encoding.encoding, 'replace')
                 for s in colorized.splitlines())

    # consume one colorized line per template line via a 'colorize' filter
    tmpl.filters['colorize'] = lambda x: coloriter.next()

    oldl = tmpl.cache[field]
    newl = oldl.replace('line|escape', 'line|colorize')
    tmpl.cache[field] = newl
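For context, pygmentize() above is meant to be driven by the extension's interface module, which wraps an hgweb handler. The sketch below shows roughly how such a caller could look; the wrapper name, the config lookup, and the use of the 'fileline' field are illustrative assumptions rather than a verbatim copy of that module.

# Hypothetical caller sketch (not the actual interface module): wrap an
# hgweb handler so rendered file lines pass through the 'colorize' filter
# that pygmentize() installs on the template engine.
def filerevision_highlight(orig, web, req, tmpl, fctx):
    style = web.config('web', 'pygments_style', 'colorful')
    # adds the SYNTAX_CSS <link> to the header, registers
    # tmpl.filters['colorize'], and rewrites the 'fileline' template entry
    pygmentize('fileline', fctx, style, tmpl)
    return orig(web, req, tmpl, fctx)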