u/ewong/rhodecode-enterprise-ce-fork Files · rhodecode/lib/markup_renderer.py

license: updated copyright year to 2017

marcink - - Load All Authors

File last commit:

r1271:47a44c03 default


                r1271:47a44c03

default

Download file

             markup_renderer.py
        
                    273 lines
            
             | 9.4 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / rhodecode / lib / markup_renderer.py
          
                    History
                
                 |
                  Source
                 | Raw
                 |Copy content
                 |Copy permalink

        marcink
    
project: added all source files and assets

              r1
            
      # -*- coding: utf-8 -*-

        marcink
    
license: updated copyright year to 2017

              r1271
            
      # Copyright (C) 2011-2017 RhodeCode GmbH

        marcink
    
project: added all source files and assets

              r1
            
      #

      # This program is free software: you can redistribute it and/or modify

      # it under the terms of the GNU Affero General Public License, version 3

      # (only), as published by the Free Software Foundation.

      #

      # This program is distributed in the hope that it will be useful,

      # but WITHOUT ANY WARRANTY; without even the implied warranty of

      # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

      # GNU General Public License for more details.

      #

      # You should have received a copy of the GNU Affero General Public License

      # along with this program.  If not, see <http://www.gnu.org/licenses/>.

      #

      # This program is dual-licensed. If you wish to learn more about the

      # RhodeCode Enterprise Edition, including its added features, Support services,

      # and proprietary license terms, please see https://rhodecode.com/licenses/

      """

      Renderer for markup languages with ability to parse using rst or markdown

      """

      import re

      import os

      import logging

        marcink
    
readme/markup: improved order of generating readme files. Fixes #4050...

              r396
            
      import itertools

        marcink
    
project: added all source files and assets

              r1
            
      from mako.lookup import TemplateLookup

      from docutils.core import publish_parts

      from docutils.parsers.rst import directives

      import markdown

        marcink
    
markdown: enable full githubFlavoredMarkdown

              r317
            
      from rhodecode.lib.markdown_ext import (

          UrlizeExtension, GithubFlavoredMarkdownExtension)

        marcink
    
project: added all source files and assets

              r1
            
      from rhodecode.lib.utils2 import safe_unicode, md5_safe, MENTIONS_REGEX

      log = logging.getLogger(__name__)

      # default renderer used to generate automated comments

      DEFAULT_COMMENTS_RENDERER = 'rst'

      class MarkupRenderer(object):
          """
          Renders markup source to HTML using markdown, reStructuredText or a
          plain-text fallback; the renderer can be picked from a file name.
          """

          # rst directive names that `rst()` registers with a None handler
          RESTRUCTUREDTEXT_DISALLOWED_DIRECTIVES = ['include', 'meta', 'raw']

          # file names ending in .md, .mkd, .mkdn, .mdown or .markdown (any case)
          MARKDOWN_PAT = re.compile(r'\.(md|mkdn?|mdown|markdown)$', re.IGNORECASE)

          # file names ending in .rst or .rest (any case)
          RST_PAT = re.compile(r'\.re?st$', re.IGNORECASE)

          # a file called exactly "readme" (any case) with no extension;
          # `_detect_renderer` maps this pattern to the rst renderer
          PLAIN_PAT = re.compile(r'^readme$', re.IGNORECASE)

        marcink
    
readme/markup: improved order of generating readme files. Fixes #4050...

              r396
            
          # extension together with weights. Lower is first means we control how

          # extensions are attached to readme names with those.

          PLAIN_EXTS = [

        johbo
    
renderer: Clean up obsolete code...

              r773
            
              # prefer no extension

        marcink
    
readme/markup: improved order of generating readme files. Fixes #4050...

              r396
            
              ('', 0),  # special case that renders READMES names without extension

              ('.text', 2), ('.TEXT', 2),

              ('.txt', 3), ('.TXT', 3)

          ]

          RST_EXTS = [

              ('.rst', 1), ('.rest', 1),

              ('.RST', 2), ('.REST', 2)

          ]

          MARKDOWN_EXTS = [

              ('.md', 1), ('.MD', 1),

              ('.mkdn', 2), ('.MKDN', 2),

              ('.mdown', 3), ('.MDOWN', 3),

              ('.markdown', 4), ('.MARKDOWN', 4)

          ]

        marcink
    
project: added all source files and assets

              r1
            
          def _detect_renderer(self, source, filename=None):

              """

              runs detection of what renderer should be used for generating html

              from a markup language

              filename can be also explicitly a renderer name

              :param source:

              :param filename:

              """

              if MarkupRenderer.MARKDOWN_PAT.findall(filename):

                  detected_renderer = 'markdown'

              elif MarkupRenderer.RST_PAT.findall(filename):

                  detected_renderer = 'rst'

              elif MarkupRenderer.PLAIN_PAT.findall(filename):

                  detected_renderer = 'rst'

              else:

                  detected_renderer = 'plain'

              return getattr(MarkupRenderer, detected_renderer)

        marcink
    
readme/markup: improved order of generating readme files. Fixes #4050...

              r396
            
          @classmethod

          def renderer_from_filename(cls, filename, exclude):

              """

        marcink
    
renderer: fixed the helper funtion to original version. This...

              r401
            
              Detect renderer markdown/rst from filename and optionally use exclude

              list to remove some options. This is mostly used in helpers.

              Returns None when no renderer can be detected.

        marcink
    
readme/markup: improved order of generating readme files. Fixes #4050...

              r396
            
              """

              def _filter(elements):

                  if isinstance(exclude, (list, tuple)):

                      return [x for x in elements if x not in exclude]

                  return elements

              if filename.endswith(

                      tuple(_filter([x[0] for x in cls.MARKDOWN_EXTS if x[0]]))):

                  return 'markdown'

              if filename.endswith(tuple(_filter([x[0] for x in cls.RST_EXTS if x[0]]))):

                  return 'rst'

        marcink
    
renderer: fixed the helper funtion to original version. This...

              r401
            
              return None

        marcink
    
readme/markup: improved order of generating readme files. Fixes #4050...

              r396
            
        marcink
    
project: added all source files and assets

              r1
            
          def render(self, source, filename=None):

              """

              Renders a given filename using detected renderer

              it detects renderers based on file extension or mimetype.

              At last it will just do a simple html replacing new lines with <br/>

              :param file_name:

              :param source:

              """

              renderer = self._detect_renderer(source, filename)

              readme_data = renderer(source)

              return readme_data

          @classmethod

          def _flavored_markdown(cls, text):

              """

              Github style flavored markdown

              :param text:

              """

              # Extract pre blocks.

              extractions = {}

              def pre_extraction_callback(matchobj):

                  digest = md5_safe(matchobj.group(0))

                  extractions[digest] = matchobj.group(0)

                  return "{gfm-extraction-%s}" % digest

              pattern = re.compile(r'<pre>.*?</pre>', re.MULTILINE | re.DOTALL)

              text = re.sub(pattern, pre_extraction_callback, text)

              # Prevent foo_bar_baz from ending up with an italic word in the middle.

              def italic_callback(matchobj):

                  s = matchobj.group(0)

                  if list(s).count('_') >= 2:

                      return s.replace('_', r'\_')

                  return s

              text = re.sub(r'^(?! {4}|\t)\w+_\w+_\w[\w_]*', italic_callback, text)

              # Insert pre block extractions.

              def pre_insert_callback(matchobj):

                  return '\n\n' + extractions[matchobj.group(1)]

              text = re.sub(r'\{gfm-extraction-([0-9a-f]{32})\}',

                            pre_insert_callback, text)

              return text

          @classmethod

          def urlify_text(cls, text):

              url_pat = re.compile(r'(http[s]?://(?:[a-zA-Z]|[0-9]|[$-_@.&+]'

                                   r'|[!*\(\),]|(?:%[0-9a-fA-F][0-9a-fA-F]))+)')

              def url_func(match_obj):

                  url_full = match_obj.groups()[0]

                  return '<a href="%(url)s">%(url)s</a>' % ({'url': url_full})

              return url_pat.sub(url_func, text)

          @classmethod
          def plain(cls, source, universal_newline=True):
              """
              Render ``source`` as plain text: urls become links and every
              newline becomes ``<br />``. The result always starts with ``<br />``.

              :param source: text to render; passed through ``safe_unicode`` first
              :param universal_newline: when true, re-join the lines with ``\\n``
                  so that every line ending understood by ``splitlines`` is
                  turned into a ``<br />``
              :returns: html string
              """
              text = safe_unicode(source)
              if universal_newline:
                  text = '\n'.join(text.splitlines())

              linked = cls.urlify_text(text)
              return '<br />' + linked.replace("\n", '<br />')

          @classmethod
          def markdown(cls, source, safe=True, flavored=True, mentions=False):
              """
              Render markdown ``source`` to html.

              :param source: markdown text
              :param safe: when true, a rendering error is logged and the source
                  is rendered with ``plain`` instead; when false the error is
                  re-raised
              :param flavored: when true, add the Github flavored extension and
                  run ``_flavored_markdown`` over the source first
              :param mentions: when true, wrap every ``MENTIONS_REGEX`` match as
                  a bold ``@name`` before rendering
              :returns: html string
              """
              # It does not allow to insert inline HTML. In presence of HTML tags, it
              # will replace them instead with [HTML_REMOVED]. This is controlled by
              # the safe_mode=True parameter of the markdown method.
              extensions = ['codehilite', 'extra', 'def_list', 'sane_lists']
              if flavored:
                  extensions.append(GithubFlavoredMarkdownExtension())

              if mentions:
                  def _bold_mention(found):
                      return ' **@%(uname)s** ' % {'uname': found.groups()[0]}

                  highlighted = re.compile(MENTIONS_REGEX).sub(
                      _bold_mention, source).strip()
                  # mentions are marked up now, so render with mentions switched off
                  return cls.markdown(highlighted, safe=safe, flavored=flavored,
                                      mentions=False)

              text = safe_unicode(source)
              try:
                  if flavored:
                      text = cls._flavored_markdown(text)
                  return markdown.markdown(
                      text, extensions, safe_mode=True, enable_attributes=False)
              except Exception:
                  log.exception('Error when rendering Markdown')
                  if not safe:
                      raise
                  log.debug('Fallback to render in plain mode')
                  return cls.plain(text)

          @classmethod
          def rst(cls, source, safe=True, mentions=False):
              """
              Render reStructuredText ``source`` to html.

              :param source: rst text
              :param safe: when true, a rendering error is logged and the source
                  is rendered with ``plain`` instead; when false the error is
                  re-raised
              :param mentions: when true, wrap every ``MENTIONS_REGEX`` match as
                  a bold ``@name`` before rendering
              :returns: the document's ``html_title`` followed by its ``fragment``
              """
              if mentions:
                  mention_pat = re.compile(MENTIONS_REGEX)

                  def wrapp(match_obj):
                      uname = match_obj.groups()[0]
                      return ' **@%(uname)s** ' % {'uname': uname}

                  mention_hl = mention_pat.sub(wrapp, source).strip()
                  # we extracted mentions render with this using Mentions false
                  return cls.rst(mention_hl, safe=safe, mentions=False)

              source = safe_unicode(source)
              try:
                  # Register a None handler for each disallowed directive name
                  # (presumably so docutils no longer resolves them - confirm
                  # against the docutils directive registry). Only the directive
                  # names are registered; setting keys must not end up here.
                  for alias in cls.RESTRUCTUREDTEXT_DISALLOWED_DIRECTIVES:
                      directives.register_directive(alias, None)

                  # Real docutils settings only; directive names are not settings.
                  docutils_settings = {
                      'input_encoding': 'unicode',
                      'report_level': 4,
                  }

                  parts = publish_parts(source=source,
                                        writer_name="html4css1",
                                        settings_overrides=docutils_settings)

                  return parts['html_title'] + parts["fragment"]
              except Exception:
                  log.exception('Error when rendering RST')
                  if safe:
                      log.debug('Fallbacking to render in plain mode')
                      return cls.plain(source)
                  else:
                      raise

      class RstTemplateRenderer(object):
          """
          Renders templates looked up in the ``templates/rst_templates``
          directory that sits one level above this module's directory.
          """

          def __init__(self):
              package_root = os.path.abspath(
                  os.path.dirname(os.path.dirname(__file__)))
              template_dir = os.path.join(
                  package_root, 'templates', 'rst_templates')
              self.template_store = TemplateLookup(
                  directories=[template_dir],
                  input_encoding='utf-8',
                  imports=['from rhodecode.lib import helpers as h'])

          def _get_template(self, templatename):
              """Return the template called ``templatename`` from the store."""
              store = self.template_store
              return store.get_template(templatename)

          def render(self, template_name, **kwargs):
              """Render ``template_name``, passing ``kwargs`` to the template."""
              return self._get_template(template_name).render(**kwargs)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

marcink project: added all source files and assets	r1	# -- coding: utf-8 --

marcink license: updated copyright year to 2017	r1271	# Copyright (C) 2011-2017 RhodeCode GmbH
marcink project: added all source files and assets	r1	#
		# This program is free software: you can redistribute it and/or modify
		# it under the terms of the GNU Affero General Public License, version 3
		# (only), as published by the Free Software Foundation.
		#
		# This program is distributed in the hope that it will be useful,
		# but WITHOUT ANY WARRANTY; without even the implied warranty of
		# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
		# GNU General Public License for more details.
		#
		# You should have received a copy of the GNU Affero General Public License
		# along with this program. If not, see <http://www.gnu.org/licenses/>.
		#
		# This program is dual-licensed. If you wish to learn more about the
		# RhodeCode Enterprise Edition, including its added features, Support services,
		# and proprietary license terms, please see https://rhodecode.com/licenses/


		"""
		Renderer for markup languages with ability to parse using rst or markdown
		"""

		import re
		import os
		import logging
marcink readme/markup: improved order of generating readme files. Fixes #4050...	r396	import itertools

marcink project: added all source files and assets	r1	from mako.lookup import TemplateLookup

		from docutils.core import publish_parts
		from docutils.parsers.rst import directives
		import markdown

marcink markdown: enable full githubFlavoredMarkdown	r317	from rhodecode.lib.markdown_ext import (
		UrlizeExtension, GithubFlavoredMarkdownExtension)
marcink project: added all source files and assets	r1	from rhodecode.lib.utils2 import safe_unicode, md5_safe, MENTIONS_REGEX

		log = logging.getLogger(__name__)

		# default renderer used to generate automated comments
		DEFAULT_COMMENTS_RENDERER = 'rst'


		class MarkupRenderer(object):
		RESTRUCTUREDTEXT_DISALLOWED_DIRECTIVES = ['include', 'meta', 'raw']

		MARKDOWN_PAT = re.compile(r'\.(md\|mkdn?\|mdown\|markdown)$', re.IGNORECASE)
		RST_PAT = re.compile(r'\.re?st$', re.IGNORECASE)
		PLAIN_PAT = re.compile(r'^readme$', re.IGNORECASE)

marcink readme/markup: improved order of generating readme files. Fixes #4050...	r396	# extension together with weights. Lower is first means we control how
		# extensions are attached to readme names with those.
		PLAIN_EXTS = [
johbo renderer: Clean up obsolete code...	r773	# prefer no extension
marcink readme/markup: improved order of generating readme files. Fixes #4050...	r396	('', 0), # special case that renders READMES names without extension
		('.text', 2), ('.TEXT', 2),
		('.txt', 3), ('.TXT', 3)
		]

		RST_EXTS = [
		('.rst', 1), ('.rest', 1),
		('.RST', 2), ('.REST', 2)
		]

		MARKDOWN_EXTS = [
		('.md', 1), ('.MD', 1),
		('.mkdn', 2), ('.MKDN', 2),
		('.mdown', 3), ('.MDOWN', 3),
		('.markdown', 4), ('.MARKDOWN', 4)
		]

marcink project: added all source files and assets	r1	def _detect_renderer(self, source, filename=None):
		"""
		runs detection of what renderer should be used for generating html
		from a markup language

		filename can be also explicitly a renderer name

		:param source:
		:param filename:
		"""

		if MarkupRenderer.MARKDOWN_PAT.findall(filename):
		detected_renderer = 'markdown'
		elif MarkupRenderer.RST_PAT.findall(filename):
		detected_renderer = 'rst'
		elif MarkupRenderer.PLAIN_PAT.findall(filename):
		detected_renderer = 'rst'
		else:
		detected_renderer = 'plain'

		return getattr(MarkupRenderer, detected_renderer)

marcink readme/markup: improved order of generating readme files. Fixes #4050...	r396	@classmethod
		def renderer_from_filename(cls, filename, exclude):
		"""
marcink renderer: fixed the helper funtion to original version. This...	r401	Detect renderer markdown/rst from filename and optionally use exclude
		list to remove some options. This is mostly used in helpers.
		Returns None when no renderer can be detected.
marcink readme/markup: improved order of generating readme files. Fixes #4050...	r396	"""
		def _filter(elements):
		if isinstance(exclude, (list, tuple)):
		return [x for x in elements if x not in exclude]
		return elements

		if filename.endswith(
		tuple(_filter([x[0] for x in cls.MARKDOWN_EXTS if x[0]]))):
		return 'markdown'
		if filename.endswith(tuple(_filter([x[0] for x in cls.RST_EXTS if x[0]]))):
		return 'rst'

marcink renderer: fixed the helper funtion to original version. This...	r401	return None
marcink readme/markup: improved order of generating readme files. Fixes #4050...	r396
marcink project: added all source files and assets	r1	def render(self, source, filename=None):
		"""
		Renders a given filename using detected renderer
		it detects renderers based on file extension or mimetype.
		At last it will just do a simple html replacing new lines with <br/>

		:param file_name:
		:param source:
		"""

		renderer = self._detect_renderer(source, filename)
		readme_data = renderer(source)
		return readme_data

		@classmethod
		def _flavored_markdown(cls, text):
		"""
		Github style flavored markdown

		:param text:
		"""

		# Extract pre blocks.
		extractions = {}

		def pre_extraction_callback(matchobj):
		digest = md5_safe(matchobj.group(0))
		extractions[digest] = matchobj.group(0)
		return "{gfm-extraction-%s}" % digest
		pattern = re.compile(r'<pre>.*?</pre>', re.MULTILINE \| re.DOTALL)
		text = re.sub(pattern, pre_extraction_callback, text)

		# Prevent foo_bar_baz from ending up with an italic word in the middle.
		def italic_callback(matchobj):
		s = matchobj.group(0)
		if list(s).count('_') >= 2:
		return s.replace('_', r'\_')
		return s
		text = re.sub(r'^(?! {4}\|\t)\w+_\w+_\w[\w_]*', italic_callback, text)

		# Insert pre block extractions.
		def pre_insert_callback(matchobj):
		return '\n\n' + extractions[matchobj.group(1)]
		text = re.sub(r'\{gfm-extraction-([0-9a-f]{32})\}',
		pre_insert_callback, text)

		return text

		@classmethod
		def urlify_text(cls, text):
		url_pat = re.compile(r'(http[s]?://(?:[a-zA-Z]\|[0-9]\|[$-_@.&+]'
		r'\|[!*\(\),]\|(?:%[0-9a-fA-F][0-9a-fA-F]))+)')

		def url_func(match_obj):
		url_full = match_obj.groups()[0]
		return '<a href="%(url)s">%(url)s</a>' % ({'url': url_full})

		return url_pat.sub(url_func, text)

		@classmethod
		def plain(cls, source, universal_newline=True):
		source = safe_unicode(source)
		if universal_newline:
		newline = '\n'
		source = newline.join(source.splitlines())

		source = cls.urlify_text(source)
		return '<br />' + source.replace("\n", '<br />')

		@classmethod
marcink markdown: enable gfm by default, this is much standard now and we should use it instead of plain markdown	r318	def markdown(cls, source, safe=True, flavored=True, mentions=False):
marcink project: added all source files and assets	r1	# It does not allow to insert inline HTML. In presence of HTML tags, it
		# will replace them instead with [HTML_REMOVED]. This is controlled by
		# the safe_mode=True parameter of the markdown method.
		extensions = ['codehilite', 'extra', 'def_list', 'sane_lists']
		if flavored:
marcink markdown: enable full githubFlavoredMarkdown	r317	extensions.append(GithubFlavoredMarkdownExtension())
marcink project: added all source files and assets	r1
		if mentions:
		mention_pat = re.compile(MENTIONS_REGEX)

		def wrapp(match_obj):
		uname = match_obj.groups()[0]
		return ' @%(uname)s ' % {'uname': uname}
		mention_hl = mention_pat.sub(wrapp, source).strip()
		# we extracted mentions render with this using Mentions false
		return cls.markdown(mention_hl, safe=safe, flavored=flavored,
		mentions=False)

		source = safe_unicode(source)
		try:
		if flavored:
		source = cls._flavored_markdown(source)
		return markdown.markdown(
		source, extensions, safe_mode=True, enable_attributes=False)
		except Exception:
		log.exception('Error when rendering Markdown')
		if safe:
marcink markdown: enable gfm by default, this is much standard now and we should use it instead of plain markdown	r318	log.debug('Fallback to render in plain mode')
marcink project: added all source files and assets	r1	return cls.plain(source)
		else:
		raise

		@classmethod
		def rst(cls, source, safe=True, mentions=False):
		if mentions:
		mention_pat = re.compile(MENTIONS_REGEX)

		def wrapp(match_obj):
		uname = match_obj.groups()[0]
		return ' @%(uname)s ' % {'uname': uname}
		mention_hl = mention_pat.sub(wrapp, source).strip()
		# we extracted mentions render with this using Mentions false
		return cls.rst(mention_hl, safe=safe, mentions=False)

		source = safe_unicode(source)
		try:
marcink markdown: enable gfm by default, this is much standard now and we should use it instead of plain markdown	r318	docutils_settings = dict(
		[(alias, None) for alias in
		cls.RESTRUCTUREDTEXT_DISALLOWED_DIRECTIVES])
marcink project: added all source files and assets	r1
		docutils_settings.update({'input_encoding': 'unicode',
		'report_level': 4})

		for k, v in docutils_settings.iteritems():
		directives.register_directive(k, v)

		parts = publish_parts(source=source,
		writer_name="html4css1",
		settings_overrides=docutils_settings)

		return parts['html_title'] + parts["fragment"]
		except Exception:
		log.exception('Error when rendering RST')
		if safe:
		log.debug('Fallbacking to render in plain mode')
		return cls.plain(source)
		else:
		raise


		class RstTemplateRenderer(object):

		def __init__(self):
		base = os.path.abspath(os.path.dirname(os.path.dirname(__file__)))
		rst_template_dirs = [os.path.join(base, 'templates', 'rst_templates')]
		self.template_store = TemplateLookup(
		directories=rst_template_dirs,
		input_encoding='utf-8',
		imports=['from rhodecode.lib import helpers as h'])

		def _get_template(self, templatename):
		return self.template_store.get_template(templatename)

		def render(self, template_name, **kwargs):
		template = self._get_template(template_name)
		return template.render(**kwargs)