rhodecode-enterprise-ce Files · rhodecode/lib/markup_renderer.py

feat(archive-cache): re-calculate size better if we miss it in stats

ilin.s - - Load All Authors

File last commit:

r5273:5af2b517 default


                r5425:9c658c9d

default

Download file

             markup_renderer.py
        
                    581 lines
            
             | 19.6 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / rhodecode / lib / markup_renderer.py
          
                    History
                
                 |
                  Annotation
                 | Raw
                 |Copy content
                 |Copy permalink

      # Copyright (C) 2011-2023 RhodeCode GmbH

      #

      # This program is free software: you can redistribute it and/or modify

      # it under the terms of the GNU Affero General Public License, version 3

      # (only), as published by the Free Software Foundation.

      #

      # This program is distributed in the hope that it will be useful,

      # but WITHOUT ANY WARRANTY; without even the implied warranty of

      # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

      # GNU General Public License for more details.

      #

      # You should have received a copy of the GNU Affero General Public License

      # along with this program.  If not, see <http://www.gnu.org/licenses/>.

      #

      # This program is dual-licensed. If you wish to learn more about the

      # RhodeCode Enterprise Edition, including its added features, Support services,

      # and proprietary license terms, please see https://rhodecode.com/licenses/

      """

      Renderer for markup languages with ability to parse using rst or markdown

      """

      import re

      import os

      import lxml

      import logging

      import urllib.parse

      import pycmarkgfm

      from mako.lookup import TemplateLookup

      from mako.template import Template as MakoTemplate

      from docutils.core import publish_parts

      from docutils.parsers.rst import directives

      from docutils import writers

      from docutils.writers import html4css1

      import markdown

      from rhodecode.lib.utils2 import safe_str, MENTIONS_REGEX

      log = logging.getLogger(__name__)

      # default renderer used to generate automated comments

      DEFAULT_COMMENTS_RENDERER = 'rst'

      # Pull in the lxml.html parse/serialize helpers. When the import fails the
      # error is logged and both names are set to None; relative_links() checks
      # these names before touching any HTML.
      try:
          from lxml.html import fromstring
          from lxml.html import tostring
      except ImportError:
          log.exception('Failed to import lxml')
          fromstring = None
          tostring = None

      class CustomHTMLTranslator(writers.html4css1.HTMLTranslator):
          """
          Custom HTML Translator used for sandboxing potential
          JS injections in ref links
          """

          # C0 control characters and space. URL parsers in browsers strip these
          # around the scheme and drop tab/newline anywhere in the URL, so they
          # have to be ignored when comparing the scheme name.
          _SCHEME_NOISE = re.compile(r'[\x00-\x20]')

          def visit_literal_block(self, node):
              """Open literal blocks as ``<pre class="codehilite literal-block">``."""
              self.body.append(self.starttag(node, 'pre', CLASS='codehilite literal-block'))

          def visit_reference(self, node):
              """
              Replace ``javascript:`` reference targets with a harmless
              placeholder, then delegate to the stock html4css1 translator.

              :param node: docutils reference node; only its ``refuri``
                  attribute is inspected and possibly rewritten
              """
              if 'refuri' in node.attributes:
                  refuri = node['refuri']
                  if ':' in refuri:
                      scheme = refuri.lstrip().split(':', 1)[0]
                      # "java\tscript:" or "\x01javascript:" is still executed
                      # by browsers, so normalise before comparing
                      scheme = self._SCHEME_NOISE.sub('', scheme.strip())

                      if scheme.lower() == 'javascript':
                          # we don't allow javascript type of refs...
                          node['refuri'] = 'javascript:alert("SandBoxedJavascript")'

              # explicit base-class call kept from the original implementation
              return html4css1.HTMLTranslator.visit_reference(self, node)

      class RhodeCodeWriter(writers.html4css1.Writer):
          """html4css1 writer whose translator class is CustomHTMLTranslator."""

          def __init__(self):
              super().__init__()
              # swap in the translator that sandboxes javascript: references
              self.translator_class = CustomHTMLTranslator

      def relative_links(html_source, server_paths):
          """
          Rewrite relative ``src``/``href`` attributes of rendered HTML so they
          point at server paths.

          :param html_source: HTML markup; falsy values are returned unchanged
          :param server_paths: mapping with a ``'raw'`` entry (used for
              ``img``/``video`` sources and links ending in ``?raw=1``) and a
              ``'standard'`` entry (used for every other link)
          :return: the rewritten markup serialized as text, or ``html_source``
              itself when it is empty, lxml is unavailable or parsing fails
          """
          if not html_source:
              return html_source

          # both helpers are None when the lxml import failed; the previous
          # ``not fromstring and tostring`` never matched that case
          if not (fromstring and tostring):
              return html_source

          try:
              doc = fromstring(html_source)
          except Exception:
              # best effort: markup that cannot be parsed is left untouched
              return html_source

          for el in doc.cssselect('img, video'):
              src = el.attrib.get('src')
              if src:
                  el.attrib['src'] = relative_path(src, server_paths['raw'])

          # anchors carrying the "gfm" class are deliberately left alone
          for el in doc.cssselect('a:not(.gfm)'):
              href = el.attrib.get('href')
              if href:
                  path_kind = 'raw' if href.endswith('?raw=1') else 'standard'
                  el.attrib['href'] = relative_path(href, server_paths[path_kind])

          return tostring(doc, encoding='unicode')

      def relative_path(path, request_path, is_repo_file=None):
          """
          Resolve a relative link against the current (non absolute) server path.

          Example::

              path = '../logo.png'
              request_path = '/repo/files/path/file.md'
              result = '/repo/files/logo.png'

          :param path: link target as found in the markup
          :param request_path: server path of the document being rendered
          :param is_repo_file: optional callable telling whether ``request_path``
              is a file; when omitted every request path counts as one
          :return: ``request_path`` for an empty ``path``; ``path`` unchanged for
              data/javascript/anchor/invalid links, links with a network
              location, or an empty ``request_path``; otherwise the resolved
              path with a single leading slash
          """
          # TODO(marcink): unicode/str support ?
          # maybe=> safe_str(urllib.quote(safe_str(final_path), '/:'))

          # default checker: assume the request path is a valid file path
          file_checker = is_repo_file or (lambda _p: True)

          if not path:
              return request_path

          link = safe_str(path)
          base = safe_str(request_path)

          # skip data, anchor, invalid links
          if link.startswith(('data:', 'javascript:', '#', ':')):
              return link

          # a network location means an absolute URL; an empty base leaves
          # nothing to resolve against
          if urllib.parse.urlparse(link).netloc or not base:
              return link

          # drop one leading "/" and then one leading "./"
          link = link[1:] if link.startswith('/') else link
          link = link[2:] if link.startswith('./') else link

          segments = base.split('/')

          # number of trailing segments to cut from the request path: one when
          # it names a file, plus one for every leading "../" of the link
          levels_up = 1 if file_checker(base) else 0
          while link.startswith('../'):
              levels_up += 1
              link = link[3:]

          if levels_up > 0:
              segments = segments[:-levels_up]

          segments.append(link)
          return '/' + '/'.join(segments).lstrip('/')

      # configured ``markdown.Markdown`` instances, keyed by
      # ``(tuple(extensions), output_format)``
      _cached_markdown_renderer = {}


      def get_markdown_renderer(extensions, output_format):
          """
          Return a cached ``markdown.Markdown`` instance for the given setup.

          Previously the first call decided the configuration for every later
          call, whatever arguments were passed; each distinct configuration now
          gets its own cached instance.

          :param extensions: sequence of extensions; ``'legacy_attrs'`` is
              always appended
          :param output_format: output format name passed to ``markdown.Markdown``
          :return: the ``markdown.Markdown`` instance for this configuration
          """
          cache_key = (tuple(extensions), output_format)
          renderer = _cached_markdown_renderer.get(cache_key)

          if renderer is None:
              renderer = markdown.Markdown(
                  extensions=list(extensions) + ['legacy_attrs'],
                  output_format=output_format)
              _cached_markdown_renderer[cache_key] = renderer
          return renderer

      def get_markdown_renderer_flavored(extensions, output_format):
          """
          Return an object with a ``convert(source)`` method, like the markdown
          renderer, that first runs the source through pycmarkgfm.

          :param extensions: forwarded to ``get_markdown_renderer``
          :param output_format: forwarded to ``get_markdown_renderer``
          """
          base_renderer = get_markdown_renderer(extensions, output_format)

          class GFM(object):
              """Adapter: parse as GFM, emit CommonMark, render it with markdown."""

              def convert(self, source):
                  hardbreaks = pycmarkgfm.options.hardbreaks
                  with pycmarkgfm.parse_gfm(source, options=hardbreaks) as gfm_doc:
                      return base_renderer.convert(gfm_doc.to_commonmark())

          return GFM()

      class MarkupRenderer(object):
          """
          Renderers (plain, markdown, rst, jupyter) that turn markup source into
          HTML, plus filename based detection of which renderer to use.
          """

          # directive names that rst() registers as ``None`` before publishing
          RESTRUCTUREDTEXT_DISALLOWED_DIRECTIVES = ['include', 'meta', 'raw']

          # filename patterns consulted by _detect_renderer(); case-insensitive
          MARKDOWN_PAT = re.compile(r'\.(md|mkdn?|mdown|markdown)$', re.IGNORECASE)
          RST_PAT = re.compile(r'\.re?st$', re.IGNORECASE)
          JUPYTER_PAT = re.compile(r'\.(ipynb)$', re.IGNORECASE)
          PLAIN_PAT = re.compile(r'^readme$', re.IGNORECASE)

          # http/https URLs; urlify_text() turns the single capture group into
          # an anchor
          URL_PAT = re.compile(r'(http[s]?://(?:[a-zA-Z]|[0-9]|[$-_@.&+]'
                               r'|[!*\(\),]|(?:%[0-9a-fA-F][0-9a-fA-F]))+)')

          # user mentions; convert_mentions() reads the first group as the name
          MENTION_PAT = re.compile(MENTIONS_REGEX)

          # extensions and output format handed to the markdown renderer
          # factories by markdown()
          extensions = ['markdown.extensions.codehilite', 'markdown.extensions.extra',
                        'markdown.extensions.def_list', 'markdown.extensions.sane_lists']

          output_format = 'html4'

          # (extension, weight) pairs, lower weight first. The weights are not
          # read in this class -- presumably callers use them to order candidate
          # README file names; verify against the callers.
          PLAIN_EXTS = [
              # prefer no extension
              ('', 0),  # special case that renders READMES names without extension
              ('.text', 2), ('.TEXT', 2),
              ('.txt', 3), ('.TXT', 3)
          ]

          RST_EXTS = [
              ('.rst', 1), ('.rest', 1),
              ('.RST', 2), ('.REST', 2)
          ]

          MARKDOWN_EXTS = [
              ('.md', 1), ('.MD', 1),
              ('.mkdn', 2), ('.MKDN', 2),
              ('.mdown', 3), ('.MDOWN', 3),
              ('.markdown', 4), ('.MARKDOWN', 4)
          ]

          def _detect_renderer(self, source, filename=None):
              """
              Pick the render method to use for a file, based on its name.

              Markdown, reST and Jupyter extensions select the matching
              renderer; everything else, including a missing filename, is
              rendered as plain text. A bare renderer name such as ``'rst'`` is
              not an extension match and therefore also ends up as plain.

              :param source: unused, kept for interface compatibility
              :param filename: name of the file being rendered, may be ``None``
              :return: the bound ``MarkupRenderer`` render method
              """
              # the default of None used to blow up inside the regex call
              filename = filename or ''

              if MarkupRenderer.MARKDOWN_PAT.search(filename):
                  detected_renderer = 'markdown'
              elif MarkupRenderer.RST_PAT.search(filename):
                  detected_renderer = 'rst'
              elif MarkupRenderer.JUPYTER_PAT.search(filename):
                  detected_renderer = 'jupyter'
              else:
                  # README names matching PLAIN_PAT and unknown names alike
                  detected_renderer = 'plain'

              return getattr(MarkupRenderer, detected_renderer)

          @classmethod
          def sanitize_html(cls, text):
              """Run ``text`` through ``html_filters.sanitize_html(markdown=True)``."""
              # imported at call time, as in the rest of this class
              from . import html_filters
              return html_filters.sanitize_html(text, markdown=True)

          @classmethod
          def renderer_from_filename(cls, filename, exclude):
              """
              Map a filename to ``'markdown'`` or ``'rst'`` by its extension.

              :param filename: file name to inspect
              :param exclude: list or tuple of extensions to ignore; any other
                  value disables filtering
              :return: the renderer name, or ``None`` when nothing matches
              """
              excluded = exclude if isinstance(exclude, (list, tuple)) else ()

              def _suffixes(ext_weights):
                  # non-empty extensions that were not excluded
                  return tuple(
                      pair[0] for pair in ext_weights
                      if pair[0] and pair[0] not in excluded)

              # markdown is checked before rst
              candidates = (
                  ('markdown', cls.MARKDOWN_EXTS),
                  ('rst', cls.RST_EXTS),
              )
              for renderer_name, ext_weights in candidates:
                  if filename.endswith(_suffixes(ext_weights)):
                      return renderer_name

              return None

          def render(self, source, filename=None):
              """
              Render ``source`` with the renderer detected from ``filename``.

              :param source: markup text to render
              :param filename: file name used for renderer detection
              :return: whatever the detected renderer returns for ``source``
              """
              render_func = self._detect_renderer(source, filename)
              return render_func(source)

          @classmethod
          def urlify_text(cls, text):
              """Wrap every ``URL_PAT`` match in ``text`` in an HTML anchor."""

              def _as_anchor(found):
                  link = found.group(1)
                  return f'<a href="{link}">{link}</a>'

              return cls.URL_PAT.sub(_as_anchor, text)

          @classmethod
          def convert_mentions(cls, text, mode):
              """
              Highlight ``MENTION_PAT`` matches in ``text`` and strip the result.

              :param text: source text to scan for mentions
              :param mode: ``'markdown'`` (hovercard ``<strong>`` element) or
                  ``'rst'`` (bold text)
              :raises ValueError: for any other ``mode``, raised once a mention
                  is actually found
              """

              def _highlight(found):
                  username = found.group(1)
                  hovercard_url = "pyroutes.url('hovercard_username', {'username': '%s'});" % username

                  if mode == 'rst':
                      tmpl = ' **@{uname}** '
                  elif mode == 'markdown':
                      tmpl = '<strong class="tooltip-hovercard" data-hovercard-alt="{uname}" data-hovercard-url="{hovercard_url}">@{uname}</strong>'
                  else:
                      raise ValueError('mode must be rst or markdown')

                  return tmpl.format(uname=username, hovercard_url=hovercard_url)

              return cls.MENTION_PAT.sub(_highlight, text).strip()

          @classmethod
          def plain(cls, source, universal_newline=True, leading_newline=True):
              """
              Render plain text as HTML: URLs become links, newlines become
              ``<br />`` and the result is sanitized.

              :param source: text to render
              :param universal_newline: normalize all line endings to ``\\n`` first
              :param leading_newline: start the output with a ``<br />``
              """
              text = safe_str(source)
              if universal_newline:
                  text = '\n'.join(text.splitlines())

              linked = cls.urlify_text(text)
              prefix = '<br />' if leading_newline else ''

              return cls.sanitize_html(prefix + linked.replace("\n", '<br />'))

          @classmethod
          def markdown(cls, source, safe=True, flavored=True, mentions=False,
                       clean_html=True):
              """
              Render markdown ``source`` to HTML.

              :param source: markdown text
              :param safe: on a rendering error fall back to ``plain()``
                  instead of re-raising
              :param flavored: use the GFM wrapper instead of the bare renderer
              :param mentions: highlight user mentions before rendering
              :param clean_html: pass the result through ``sanitize_html()``
              :return: rendered HTML
              """
              if mentions:
                  mention_hl = cls.convert_mentions(source, mode='markdown')
                  # mentions are extracted; render again with mentions off and
                  # keep the caller's clean_html choice (it used to be dropped)
                  return cls.markdown(mention_hl, safe=safe, flavored=flavored,
                                      mentions=False, clean_html=clean_html)

              get_renderer = (
                  get_markdown_renderer_flavored if flavored
                  else get_markdown_renderer)
              markdown_renderer = get_renderer(cls.extensions, cls.output_format)

              try:
                  rendered = markdown_renderer.convert(source)
              except Exception:
                  log.exception('Error when rendering Markdown')
                  if not safe:
                      raise
                  log.debug('Fallback to render in plain mode')
                  rendered = cls.plain(source)

              if clean_html:
                  rendered = cls.sanitize_html(rendered)
              return rendered

          @classmethod
          def rst(cls, source, safe=True, mentions=False, clean_html=False):
              """
              Render reStructuredText ``source`` to HTML.

              :param source: reST text
              :param safe: on a rendering error fall back to ``plain()``
                  instead of re-raising
              :param mentions: highlight user mentions before rendering
              :param clean_html: pass the rendered fragment through
                  ``sanitize_html()``
              :return: the document's ``html_title`` part followed by the
                  rendered fragment
              """
              if mentions:
                  mention_hl = cls.convert_mentions(source, mode='rst')
                  # mentions are extracted; render again with mentions off and
                  # keep the caller's clean_html choice (it used to be dropped,
                  # so clean_html=True was silently ignored)
                  return cls.rst(mention_hl, safe=safe, mentions=False,
                                 clean_html=clean_html)

              source = safe_str(source)
              try:
                  disallowed = cls.RESTRUCTUREDTEXT_DISALLOWED_DIRECTIVES

                  # Only the disallowed directives are registered (as None).
                  # The previous loop ran over the whole settings dict and so
                  # also registered 'input_encoding', 'report_level' and
                  # 'syntax_highlight' as directives.
                  for directive_name in disallowed:
                      directives.register_directive(directive_name, None)

                  # the None-valued aliases stay in the overrides so
                  # publish_parts() receives the same settings as before
                  docutils_settings = {alias: None for alias in disallowed}
                  docutils_settings.update({
                      'input_encoding': 'unicode',
                      'report_level': 4,
                      'syntax_highlight': 'short',
                  })

                  parts = publish_parts(source=source,
                                        writer=RhodeCodeWriter(),
                                        settings_overrides=docutils_settings)
                  rendered = parts["fragment"]
                  if clean_html:
                      rendered = cls.sanitize_html(rendered)

                  return parts['html_title'] + rendered
              except Exception:
                  log.exception('Error when rendering RST')
                  if safe:
                      log.debug('Fallback to render in plain mode')
                      return cls.plain(source)
                  else:
                      raise

          @classmethod
          def jupyter(cls, source, safe=True):
              """
              Render a Jupyter notebook to HTML.

              :param source: notebook content, parsed with ``nbformat.reads``
              :param safe: when true the ``Sandbox`` preprocessor sanitizes
                  markdown cells and replaces ``application/javascript`` outputs
                  with a placeholder text
              :return: HTML body; an "Invalid Notebook!" block listing the
                  problems when the notebook does not validate
              """
              from html import escape as html_escape

              from rhodecode.lib import helpers
              from .html_sanitizer_defs import markdown_attrs, all_tags, all_styles

              from traitlets import default, config
              import nbformat
              from nbconvert import HTMLExporter
              from nbconvert.preprocessors import Preprocessor
              from nbconvert.preprocessors.sanitize import SanitizeHTML

              class CustomHTMLExporter(HTMLExporter):

                  @default("template_file")
                  def _template_file_default(self):
                      if self.template_extension:
                          return "basic/index" + self.template_extension

              class Sandbox(Preprocessor):

                  def preprocess_cell(self, cell, resources, cell_index):
                      if not safe:
                          return cell, resources

                      sandbox_text = 'SandBoxed(IPython.core.display.Javascript object)'
                      if cell.cell_type == "markdown":
                          cell.source = cls.sanitize_html(cell.source)
                          return cell, resources

                      # swap javascript outputs for a plain text placeholder
                      for cell_output in cell.get('outputs', []):
                          if 'data' in cell_output:
                              if 'application/javascript' in cell_output['data']:
                                  cell_output['data']['text/plain'] = sandbox_text
                                  cell_output['data'].pop('application/javascript', None)

                      return cell, resources

              # NOTE: this helper is not called anywhere in this method
              def _sanitize_resources(input_resources):
                  """
                  Skip/sanitize some of the CSS generated and included in jupyter
                  so it doesn't mess up UI so much
                  """

                  # TODO(marcink): probably we should replace this with whole custom
                  # CSS set that doesn't screw up, but jupyter generated html has some
                  # special markers, so it requires Custom HTML exporter template with
                  # _default_template_path_default, to achieve that

                  # strip the reset CSS
                  input_resources[0] = input_resources[0][input_resources[0].find('/*! Source'):]
                  return input_resources

              def as_html(notebook):
                  conf = config.Config()
                  # TODO: Keep an eye on the order of preprocessors
                  conf.CustomHTMLExporter.default_preprocessors = [Sandbox, SanitizeHTML]
                  conf.Sandbox.enabled = True
                  conf.SanitizeHTML.enabled = True
                  conf.SanitizeHTML.attributes = markdown_attrs
                  conf.SanitizeHTML.tags = all_tags
                  conf.SanitizeHTML.styles = all_styles
                  conf.SanitizeHTML.sanitized_output_types = {
                      "text/html",
                      "text/markdown",
                  }
                  # a missing comma used to fuse "image/jpg" and "image/jpeg"
                  # into the single bogus key "image/jpgimage/jpeg"
                  conf.SanitizeHTML.safe_output_keys = {
                      "metadata",
                      "text/plain",
                      "text/latex",
                      "application/json",
                      "image/png",
                      "image/jpg",
                      "image/jpeg",
                      "image/svg",
                      "image/svg+xml",
                  }
                  html_exporter = CustomHTMLExporter(config=conf)

                  (body, resources) = html_exporter.from_notebook_node(notebook)

                  header = '<!-- ## IPYTHON NOTEBOOK RENDERING ## -->'
                  js = MakoTemplate(r'''
                  <!-- MathJax configuration -->
                  <script type="text/x-mathjax-config">
                  MathJax.Hub.Config({
                      jax: ["input/TeX","output/HTML-CSS", "output/PreviewHTML"],
                      extensions: ["tex2jax.js","MathMenu.js","MathZoom.js", "fast-preview.js", "AssistiveMML.js", "[Contrib]/a11y/accessibility-menu.js"],
                      TeX: {
                          extensions: ["AMSmath.js","AMSsymbols.js","noErrors.js","noUndefined.js"]
                      },
                      tex2jax: {
                          inlineMath: [ ['$','$'], ["\\(","\\)"] ],
                          displayMath: [ ['$$','$$'], ["\\[","\\]"] ],
                          processEscapes: true,
                          processEnvironments: true
                      },
                      // Center justify equations in code and markdown cells. Elsewhere
                      // we use CSS to left justify single line equations in code cells.
                      displayAlign: 'center',
                      "HTML-CSS": {
                          styles: {'.MathJax_Display': {"margin": 0}},
                          linebreaks: { automatic: true },
                          availableFonts: ["STIX", "TeX"]
                      },
                      showMathMenu: false
                  });
                  </script>
                  <!-- End of MathJax configuration -->
                  <script src="${h.asset('js/src/math_jax/MathJax.js')}"></script>
                  ''').render(h=helpers)

                  css = MakoTemplate(r'''
                  <link rel="stylesheet" type="text/css" href="${h.asset('css/style-ipython.css', ver=ver)}" media="screen"/>
                  ''').render(h=helpers, ver='ver1')

                  body = '\n'.join([header, css, js, body])
                  return body, resources

              captured_errors = {}
              error_body = """
                              <div style="text-align: center;">
                                  <h3>Invalid Notebook!</h3>
                                  <p>{}</p>
                              </div>
                          """

              # TODO: In the event of a newer jupyter notebook version, consider increasing the as_version parameter
              notebook = nbformat.reads(source, as_version=4, capture_validation_error=captured_errors)
              if captured_errors:
                  # validation messages can quote content of the (untrusted)
                  # notebook, so escape them before embedding them into HTML
                  error_messages = '<br>'.join(
                      html_escape(str(error)) for error in captured_errors.values())
                  body = error_body.format(error_messages)
              else:
                  try:
                      body, _ = as_html(notebook)
                  except (AttributeError, nbformat.ValidationError):
                      # validate the raw document to tell an invalid notebook
                      # apart from an unrelated failure, which is re-raised
                      try:
                          nbformat.validate(nbformat.reader.reads(source))
                      except nbformat.ValidationError as exc:
                          body = error_body.format(html_escape(str(exc)))
                      else:
                          raise

              return body

      class RstTemplateRenderer(object):
          """Renders Mako templates looked up in ``templates/rst_templates``."""

          def __init__(self):
              # the template directory sits one level above this module's directory
              module_dir = os.path.dirname(__file__)
              package_root = os.path.abspath(os.path.dirname(module_dir))
              template_dir = os.path.join(package_root, 'templates', 'rst_templates')

              self.template_store = TemplateLookup(
                  directories=[template_dir],
                  input_encoding='utf-8',
                  imports=['from rhodecode.lib import helpers as h'])

          def _get_template(self, templatename):
              """Fetch the named template from the lookup store."""
              return self.template_store.get_template(templatename)

          def render(self, template_name, **kwargs):
              """Render ``template_name`` with ``kwargs`` as template variables."""
              return self._get_template(template_name).render(**kwargs)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages



				# Copyright (C) 2011-2023 RhodeCode GmbH
				#
				# This program is free software: you can redistribute it and/or modify
				# it under the terms of the GNU Affero General Public License, version 3
				# (only), as published by the Free Software Foundation.
				#
				# This program is distributed in the hope that it will be useful,
				# but WITHOUT ANY WARRANTY; without even the implied warranty of
				# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
				# GNU General Public License for more details.
				#
				# You should have received a copy of the GNU Affero General Public License
				# along with this program. If not, see <http://www.gnu.org/licenses/>.
				#
				# This program is dual-licensed. If you wish to learn more about the
				# RhodeCode Enterprise Edition, including its added features, Support services,
				# and proprietary license terms, please see https://rhodecode.com/licenses/


				"""
				Renderer for markup languages with ability to parse using rst or markdown
				"""

				import re
				import os
				import lxml
				import logging
				import urllib.parse
				import pycmarkgfm

				from mako.lookup import TemplateLookup
				from mako.template import Template as MakoTemplate

				from docutils.core import publish_parts
				from docutils.parsers.rst import directives
				from docutils import writers
				from docutils.writers import html4css1
				import markdown

				from rhodecode.lib.utils2 import safe_str, MENTIONS_REGEX

				log = logging.getLogger(__name__)

				# default renderer used to generate automated comments
				DEFAULT_COMMENTS_RENDERER = 'rst'

				# Pull in the lxml.html parse/serialize helpers. When the import fails
				# the error is logged and both names are set to None.
				try:
				    from lxml.html import fromstring
				    from lxml.html import tostring
				except ImportError:
				    log.exception('Failed to import lxml')
				    fromstring = None
				    tostring = None


				class CustomHTMLTranslator(writers.html4css1.HTMLTranslator):
				    """
				    Custom HTML Translator used for sandboxing potential
				    JS injections in ref links
				    """

				    # C0 control characters and space. URL parsers in browsers strip
				    # these around the scheme and drop tab/newline anywhere in the URL,
				    # so they have to be ignored when comparing the scheme name.
				    _SCHEME_NOISE = re.compile(r'[\x00-\x20]')

				    def visit_literal_block(self, node):
				        """Open literal blocks as ``<pre class="codehilite literal-block">``."""
				        self.body.append(self.starttag(node, 'pre', CLASS='codehilite literal-block'))

				    def visit_reference(self, node):
				        """
				        Replace ``javascript:`` reference targets with a harmless
				        placeholder, then delegate to the stock html4css1 translator.
				        """
				        if 'refuri' in node.attributes:
				            refuri = node['refuri']
				            if ':' in refuri:
				                scheme = refuri.lstrip().split(':', 1)[0]
				                # "java\tscript:" is still executed by browsers
				                scheme = self._SCHEME_NOISE.sub('', scheme.strip())

				                if scheme.lower() == 'javascript':
				                    # we don't allow javascript type of refs...
				                    node['refuri'] = 'javascript:alert("SandBoxedJavascript")'

				        # explicit base-class call kept from the original implementation
				        return html4css1.HTMLTranslator.visit_reference(self, node)


				class RhodeCodeWriter(writers.html4css1.Writer):
				    """html4css1 writer whose translator class is CustomHTMLTranslator."""

				    def __init__(self):
				        super(RhodeCodeWriter, self).__init__()
				        # swap in the translator that sandboxes javascript: references
				        self.translator_class = CustomHTMLTranslator


				def relative_links(html_source, server_paths):
				    """
				    Rewrite relative ``src``/``href`` attributes of rendered HTML so
				    they point at server paths.

				    :param html_source: HTML markup; falsy values are returned unchanged
				    :param server_paths: mapping with a ``'raw'`` entry (used for
				        ``img``/``video`` sources and links ending in ``?raw=1``) and a
				        ``'standard'`` entry (used for every other link)
				    :return: the rewritten markup serialized as text, or ``html_source``
				        itself when it is empty, lxml is unavailable or parsing fails
				    """
				    if not html_source:
				        return html_source

				    # both helpers are None when the lxml import failed; the previous
				    # ``not fromstring and tostring`` never matched that case
				    if not (fromstring and tostring):
				        return html_source

				    try:
				        doc = fromstring(html_source)
				    except Exception:
				        # best effort: markup that cannot be parsed is left untouched
				        return html_source

				    for el in doc.cssselect('img, video'):
				        src = el.attrib.get('src')
				        if src:
				            el.attrib['src'] = relative_path(src, server_paths['raw'])

				    # anchors carrying the "gfm" class are deliberately left alone
				    for el in doc.cssselect('a:not(.gfm)'):
				        href = el.attrib.get('href')
				        if href:
				            path_kind = 'raw' if href.endswith('?raw=1') else 'standard'
				            el.attrib['href'] = relative_path(href, server_paths[path_kind])

				    return tostring(doc, encoding='unicode')


				def relative_path(path, request_path, is_repo_file=None):
				    """
				    relative link support, path is a rel path, and request_path is current
				    server path (not absolute)

				    e.g.

				    path = '../logo.png'
				    request_path= '/repo/files/path/file.md'
				    produces: '/repo/files/logo.png'

				    :param is_repo_file: optional callable telling whether
				        ``request_path`` is a file; when omitted every request path
				        counts as one
				    """
				    # TODO(marcink): unicode/str support ?
				    # maybe=> safe_str(urllib.quote(safe_str(final_path), '/:'))

				    def dummy_check(p):
				        return True  # assume default is a valid file path

				    is_repo_file = is_repo_file or dummy_check
				    if not path:
				        return request_path

				    path = safe_str(path)
				    request_path = safe_str(request_path)

				    if path.startswith(('data:', 'javascript:', '#', ':')):
				        # skip data, anchor, invalid links
				        return path

				    # a network location means the link is an absolute URL
				    is_absolute = bool(urllib.parse.urlparse(path).netloc)
				    if is_absolute:
				        return path

				    if not request_path:
				        return path

				    if path.startswith('/'):
				        path = path[1:]

				    if path.startswith('./'):
				        path = path[2:]

				    parts = request_path.split('/')
				    # compute how deep we need to traverse the request_path
				    depth = 0

				    if is_repo_file(request_path):
				        # if request path is a VALID file, we use a relative path with
				        # one level up
				        depth += 1

				    while path.startswith('../'):
				        depth += 1
				        path = path[3:]

				    if depth > 0:
				        parts = parts[:-depth]

				    parts.append(path)
				    final_path = '/'.join(parts).lstrip('/')

				    return '/' + final_path


				# configured ``markdown.Markdown`` instances, keyed by
				# ``(tuple(extensions), output_format)``
				_cached_markdown_renderer = {}


				def get_markdown_renderer(extensions, output_format):
				    """
				    Return a cached ``markdown.Markdown`` instance for the given setup.

				    Each distinct configuration gets its own cached instance; before,
				    the first call decided the configuration for every later call.

				    :param extensions: sequence of extensions; ``'legacy_attrs'`` is
				        always appended
				    :param output_format: output format name passed to ``markdown.Markdown``
				    """
				    cache_key = (tuple(extensions), output_format)
				    renderer = _cached_markdown_renderer.get(cache_key)

				    if renderer is None:
				        renderer = markdown.Markdown(
				            extensions=list(extensions) + ['legacy_attrs'],
				            output_format=output_format)
				        _cached_markdown_renderer[cache_key] = renderer
				    return renderer


				def get_markdown_renderer_flavored(extensions, output_format):
				    """
				    Return an object with a ``convert(source)`` method, like the
				    markdown renderer, that first runs the source through pycmarkgfm.
				    """
				    md = get_markdown_renderer(extensions, output_format)

				    class GFM(object):
				        def convert(self, source):
				            with pycmarkgfm.parse_gfm(source, options=pycmarkgfm.options.hardbreaks) as document:
				                parsed_md = document.to_commonmark()
				                return md.convert(parsed_md)

				    return GFM()


				class MarkupRenderer(object):
				    """
				    Render markup sources to HTML.

				    Supported renderers are the ``markdown``, ``rst``, ``jupyter`` and
				    ``plain`` classmethods; ``render`` picks one of them from the file name.
				    """
				    RESTRUCTUREDTEXT_DISALLOWED_DIRECTIVES = ['include', 'meta', 'raw']

				    # NOTE: alternations must use a bare ``|``; an escaped ``\|`` matches a
				    # literal pipe character and the pattern would never hit real file names.
				    MARKDOWN_PAT = re.compile(r'\.(md|mkdn?|mdown|markdown)$', re.IGNORECASE)
				    RST_PAT = re.compile(r'\.re?st$', re.IGNORECASE)
				    JUPYTER_PAT = re.compile(r'\.(ipynb)$', re.IGNORECASE)
				    PLAIN_PAT = re.compile(r'^readme$', re.IGNORECASE)

				    URL_PAT = re.compile(r'(http[s]?://(?:[a-zA-Z]|[0-9]|[$-_@.&+]'
				                         r'|[!*\(\),]|(?:%[0-9a-fA-F][0-9a-fA-F]))+)')

				    MENTION_PAT = re.compile(MENTIONS_REGEX)

				    extensions = ['markdown.extensions.codehilite', 'markdown.extensions.extra',
				                  'markdown.extensions.def_list', 'markdown.extensions.sane_lists']

				    output_format = 'html4'

				    # extension together with weights. Lower is first means we control how
				    # extensions are attached to readme names with those.
				    PLAIN_EXTS = [
				        # prefer no extension
				        ('', 0),  # special case that renders READMES names without extension
				        ('.text', 2), ('.TEXT', 2),
				        ('.txt', 3), ('.TXT', 3)
				    ]

				    RST_EXTS = [
				        ('.rst', 1), ('.rest', 1),
				        ('.RST', 2), ('.REST', 2)
				    ]

				    MARKDOWN_EXTS = [
				        ('.md', 1), ('.MD', 1),
				        ('.mkdn', 2), ('.MKDN', 2),
				        ('.mdown', 3), ('.MDOWN', 3),
				        ('.markdown', 4), ('.MARKDOWN', 4)
				    ]

				    def _detect_renderer(self, source, filename=None):
				        """
				        Pick the render method that matches ``filename``.

				        :param source: markup source; not inspected by the detection
				        :param filename: name of the rendered file. ``None``, an empty name
				            or a name matching none of the patterns selects ``plain``.
				        :return: the ``markdown``, ``rst``, ``jupyter`` or ``plain``
				            classmethod of ``MarkupRenderer``
				        """
				        # ``render`` defaults filename to None; the regex API rejects None,
				        # so normalise it to an empty name which falls through to plain.
				        filename = filename or ''

				        if MarkupRenderer.MARKDOWN_PAT.search(filename):
				            detected_renderer = 'markdown'
				        elif MarkupRenderer.RST_PAT.search(filename):
				            detected_renderer = 'rst'
				        elif MarkupRenderer.JUPYTER_PAT.search(filename):
				            detected_renderer = 'jupyter'
				        else:
				            # bare README names (PLAIN_PAT) and anything unknown are plain
				            detected_renderer = 'plain'

				        return getattr(MarkupRenderer, detected_renderer)

				    @classmethod
				    def sanitize_html(cls, text):
				        """Run ``text`` through ``html_filters.sanitize_html`` in markdown mode."""
				        from .html_filters import sanitize_html
				        return sanitize_html(text, markdown=True)

				    @classmethod
				    def renderer_from_filename(cls, filename, exclude):
				        """
				        Detect renderer markdown/rst from filename and optionally use exclude
				        list to remove some options. This is mostly used in helpers.

				        :param filename: file name whose suffix is checked
				        :param exclude: list/tuple of extensions to ignore; any other value
				            disables the filtering
				        :return: ``'markdown'``, ``'rst'`` or ``None`` when nothing matches
				        """
				        def _allowed(ext_weights):
				            # drop the empty "no extension" entry and excluded extensions
				            exts = [ext for ext, _weight in ext_weights if ext]
				            if isinstance(exclude, (list, tuple)):
				                exts = [ext for ext in exts if ext not in exclude]
				            return tuple(exts)

				        if filename.endswith(_allowed(cls.MARKDOWN_EXTS)):
				            return 'markdown'
				        if filename.endswith(_allowed(cls.RST_EXTS)):
				            return 'rst'

				        return None

				    def render(self, source, filename=None):
				        """
				        Render ``source`` with the renderer detected from ``filename``.

				        Without a recognised file name the source is rendered as plain
				        text, i.e. new lines are replaced with <br/>.
				        """
				        renderer = self._detect_renderer(source, filename)
				        return renderer(source)

				    @classmethod
				    def urlify_text(cls, text):
				        """Wrap every match of ``URL_PAT`` found in ``text`` in an ``<a>`` tag."""
				        def url_func(match_obj):
				            url_full = match_obj.group(1)
				            return f'<a href="{url_full}">{url_full}</a>'

				        return cls.URL_PAT.sub(url_func, text)

				    @classmethod
				    def convert_mentions(cls, text, mode):
				        """
				        Replace user mentions matched by ``MENTION_PAT`` in ``text``.

				        :param text: source text
				        :param mode: ``'markdown'`` emits a hovercard ``<strong>`` element,
				            ``'rst'`` emits the plain ``@name`` padded with spaces
				        :raises ValueError: when a mention is found and ``mode`` is neither
				            of the two supported values
				        :return: converted text with surrounding whitespace stripped
				        """
				        def wrapp(match_obj):
				            uname = match_obj.groups()[0]
				            hovercard_url = "pyroutes.url('hovercard_username', {'username': '%s'});" % uname

				            if mode == 'markdown':
				                tmpl = '<strong class="tooltip-hovercard" data-hovercard-alt="{uname}" data-hovercard-url="{hovercard_url}">@{uname}</strong>'
				            elif mode == 'rst':
				                tmpl = ' @{uname} '
				            else:
				                raise ValueError('mode must be rst or markdown')

				            return tmpl.format(uname=uname, hovercard_url=hovercard_url)

				        return cls.MENTION_PAT.sub(wrapp, text).strip()

				    @classmethod
				    def plain(cls, source, universal_newline=True, leading_newline=True):
				        """
				        Render ``source`` as plain text: URLs become links, new lines become
				        ``<br />`` and the result is sanitized.

				        :param universal_newline: normalise all line endings to ``\\n`` first
				        :param leading_newline: prepend one ``<br />`` to the output
				        """
				        source = safe_str(source)
				        if universal_newline:
				            source = '\n'.join(source.splitlines())

				        linked = cls.urlify_text(source)
				        prefix = '<br />' if leading_newline else ''
				        return cls.sanitize_html(prefix + linked.replace("\n", '<br />'))

				    @classmethod
				    def markdown(cls, source, safe=True, flavored=True, mentions=False,
				                 clean_html=True):
				        """
				        Render Markdown ``source`` to HTML.

				        :param source: markdown text
				        :param safe: on a rendering error fall back to ``plain`` instead of
				            re-raising
				        :param flavored: build the renderer with
				            ``get_markdown_renderer_flavored`` instead of
				            ``get_markdown_renderer``
				        :param mentions: convert user mentions before rendering
				        :param clean_html: pass the rendered output through ``sanitize_html``
				        """
				        if mentions:
				            mention_hl = cls.convert_mentions(source, mode='markdown')
				            # mentions are converted now; render with mentions off and
				            # forward every other option, including clean_html, unchanged
				            return cls.markdown(mention_hl, safe=safe, flavored=flavored,
				                                mentions=False, clean_html=clean_html)

				        if flavored:
				            markdown_renderer = get_markdown_renderer_flavored(
				                cls.extensions, cls.output_format)
				        else:
				            markdown_renderer = get_markdown_renderer(
				                cls.extensions, cls.output_format)

				        try:
				            rendered = markdown_renderer.convert(source)
				        except Exception:
				            log.exception('Error when rendering Markdown')
				            if not safe:
				                raise
				            log.debug('Fallback to render in plain mode')
				            rendered = cls.plain(source)

				        if clean_html:
				            rendered = cls.sanitize_html(rendered)
				        return rendered

				    @classmethod
				    def rst(cls, source, safe=True, mentions=False, clean_html=False):
				        """
				        Render reStructuredText ``source`` to HTML.

				        :param source: rst text
				        :param safe: on a rendering error fall back to ``plain`` instead of
				            re-raising
				        :param mentions: convert user mentions before rendering
				        :param clean_html: pass the rendered fragment through
				            ``sanitize_html``; the ``html_title`` part is prepended as-is
				        """
				        if mentions:
				            mention_hl = cls.convert_mentions(source, mode='rst')
				            # mentions are converted now; render with mentions off and keep
				            # the caller's clean_html choice so sanitizing is not lost
				            return cls.rst(mention_hl, safe=safe, mentions=False,
				                           clean_html=clean_html)

				        source = safe_str(source)
				        try:
				            disallowed = cls.RESTRUCTUREDTEXT_DISALLOWED_DIRECTIVES
				            docutils_settings = {alias: None for alias in disallowed}
				            docutils_settings.update({
				                'input_encoding': 'unicode',
				                'report_level': 4,
				                'syntax_highlight': 'short',
				            })

				            # Disable the disallowed directives by registering them as None.
				            # Only directive names go here: the settings keys above are not
				            # directives and must not end up in the docutils registry.
				            for alias in disallowed:
				                directives.register_directive(alias, None)

				            parts = publish_parts(source=source,
				                                  writer=RhodeCodeWriter(),
				                                  settings_overrides=docutils_settings)
				            rendered = parts["fragment"]
				            if clean_html:
				                rendered = cls.sanitize_html(rendered)
				            return parts['html_title'] + rendered
				        except Exception:
				            log.exception('Error when rendering RST')
				            if not safe:
				                raise
				            log.debug('Fallback to render in plain mode')
				            return cls.plain(source)

				    @classmethod
				    def jupyter(cls, source, safe=True):
				        """
				        Render a Jupyter notebook (``source`` is the notebook JSON text) to
				        an HTML body using nbconvert.

				        :param source: notebook content accepted by ``nbformat.reads``
				        :param safe: when true, markdown cells are sanitized and javascript
				            outputs are replaced with a placeholder before export
				        :return: HTML string; an "Invalid Notebook!" block when the
				            notebook does not validate
				        """
				        from html import escape as html_escape

				        from rhodecode.lib import helpers
				        from .html_sanitizer_defs import markdown_attrs, all_tags, all_styles

				        from traitlets import default, config
				        import nbformat
				        from nbconvert import HTMLExporter
				        from nbconvert.preprocessors import Preprocessor
				        from nbconvert.preprocessors.sanitize import SanitizeHTML

				        class CustomHTMLExporter(HTMLExporter):

				            @default("template_file")
				            def _template_file_default(self):
				                if self.template_extension:
				                    return "basic/index" + self.template_extension

				        class Sandbox(Preprocessor):

				            def preprocess_cell(self, cell, resources, cell_index):
				                if not safe:
				                    return cell, resources
				                sandbox_text = 'SandBoxed(IPython.core.display.Javascript object)'
				                if cell.cell_type == "markdown":
				                    cell.source = cls.sanitize_html(cell.source)
				                    return cell, resources

				                # swap javascript outputs for a harmless text placeholder
				                for cell_output in cell.get('outputs', []):
				                    data = cell_output.get('data') if 'data' in cell_output else None
				                    if data is not None and 'application/javascript' in data:
				                        data['text/plain'] = sandbox_text
				                        data.pop('application/javascript', None)
				                return cell, resources

				        def _sanitize_resources(input_resources):
				            """
				            Skip/sanitize some of the CSS generated and included in jupyter
				            so it doesn't mess up UI so much
				            """
				            # NOTE: this helper is not called anywhere in this method.

				            # TODO(marcink): probably we should replace this with whole custom
				            # CSS set that doesn't screw up, but jupyter generated html has some
				            # special markers, so it requires Custom HTML exporter template with
				            # _default_template_path_default, to achieve that

				            # strip the reset CSS
				            input_resources[0] = input_resources[0][input_resources[0].find('/*! Source'):]
				            return input_resources

				        def as_html(notebook):
				            conf = config.Config()
				            # TODO: Keep an eye on the order of preprocessors
				            conf.CustomHTMLExporter.default_preprocessors = [Sandbox, SanitizeHTML]
				            conf.Sandbox.enabled = True
				            conf.SanitizeHTML.enabled = True
				            conf.SanitizeHTML.attributes = markdown_attrs
				            conf.SanitizeHTML.tags = all_tags
				            conf.SanitizeHTML.styles = all_styles
				            conf.SanitizeHTML.sanitized_output_types = {
				                "text/html",
				                "text/markdown",
				            }
				            # every entry needs its own comma: adjacent string literals are
				            # concatenated and would silently drop both mime types
				            conf.SanitizeHTML.safe_output_keys = {
				                "metadata",
				                "text/plain",
				                "text/latex",
				                "application/json",
				                "image/png",
				                "image/jpg",
				                "image/jpeg",
				                "image/svg",
				                "image/svg+xml",
				            }

				            html_exporter = CustomHTMLExporter(config=conf)

				            (body, resources) = html_exporter.from_notebook_node(notebook)

				            header = '<!-- ## IPYTHON NOTEBOOK RENDERING ## -->'
				            js = MakoTemplate(r'''
				<!-- MathJax configuration -->
				<script type="text/x-mathjax-config">
				MathJax.Hub.Config({
				jax: ["input/TeX","output/HTML-CSS", "output/PreviewHTML"],
				extensions: ["tex2jax.js","MathMenu.js","MathZoom.js", "fast-preview.js", "AssistiveMML.js", "[Contrib]/a11y/accessibility-menu.js"],
				TeX: {
				extensions: ["AMSmath.js","AMSsymbols.js","noErrors.js","noUndefined.js"]
				},
				tex2jax: {
				inlineMath: [ ['$','$'], ["\\(","\\)"] ],
				displayMath: [ ['$$','$$'], ["\\[","\\]"] ],
				processEscapes: true,
				processEnvironments: true
				},
				// Center justify equations in code and markdown cells. Elsewhere
				// we use CSS to left justify single line equations in code cells.
				displayAlign: 'center',
				"HTML-CSS": {
				styles: {'.MathJax_Display': {"margin": 0}},
				linebreaks: { automatic: true },
				availableFonts: ["STIX", "TeX"]
				},
				showMathMenu: false
				});
				</script>
				<!-- End of MathJax configuration -->
				<script src="${h.asset('js/src/math_jax/MathJax.js')}"></script>
				''').render(h=helpers)

				            css = MakoTemplate(r'''
				<link rel="stylesheet" type="text/css" href="${h.asset('css/style-ipython.css', ver=ver)}" media="screen"/>
				''').render(h=helpers, ver='ver1')

				            body = '\n'.join([header, css, js, body])
				            return body, resources

				        captured_errors = {}
				        error_body = """
				<div style="text-align: center;">
				<h3>Invalid Notebook!</h3>
				<p>{}</p>
				</div>
				"""
				        # TODO: In the event of a newer jupyter notebook version, consider increasing the as_version parameter
				        notebook = nbformat.reads(source, as_version=4, capture_validation_error=captured_errors)
				        if captured_errors:
				            # error text is derived from the notebook content, which is
				            # untrusted, so escape it before embedding it into the HTML
				            error_messages = '<br>'.join(
				                html_escape(str(error)) for error in captured_errors.values())
				            return error_body.format(error_messages)

				        try:
				            body, _ = as_html(notebook)
				        except (AttributeError, nbformat.ValidationError):
				            # report the failure as an invalid notebook only when the raw
				            # source really does not validate; otherwise re-raise it
				            try:
				                nbformat.validate(nbformat.reader.reads(source))
				            except nbformat.ValidationError as exc:
				                body = error_body.format(html_escape(str(exc)))
				            else:
				                raise
				        return body


				class RstTemplateRenderer(object):
				    """
				    Look up and render Mako templates kept in ``templates/rst_templates``.
				    """

				    def __init__(self):
				        """Build the template lookup rooted one directory above this module's."""
				        parent_dir = os.path.dirname(os.path.dirname(__file__))
				        templates_dir = os.path.join(
				            os.path.abspath(parent_dir), 'templates', 'rst_templates')
				        self.template_store = TemplateLookup(
				            directories=[templates_dir],
				            input_encoding='utf-8',
				            imports=['from rhodecode.lib import helpers as h'],
				        )

				    def _get_template(self, templatename):
				        """Return the template registered under ``templatename``."""
				        store = self.template_store
				        return store.get_template(templatename)

				    def render(self, template_name, **kwargs):
				        """Render ``template_name`` passing ``kwargs`` as template variables."""
				        return self._get_template(template_name).render(**kwargs)