markdown_ext.py
176 lines
| 6.0 KiB
| text/x-python
|
PythonLexer
r1 | # -*- coding: utf-8 -*- | |||
r4306 | # Copyright (C) 2010-2020 RhodeCode GmbH | |||
r1 | # | |||
# This program is free software: you can redistribute it and/or modify | ||||
# it under the terms of the GNU Affero General Public License, version 3 | ||||
# (only), as published by the Free Software Foundation. | ||||
# | ||||
# This program is distributed in the hope that it will be useful, | ||||
# but WITHOUT ANY WARRANTY; without even the implied warranty of | ||||
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||||
# GNU General Public License for more details. | ||||
# | ||||
# You should have received a copy of the GNU Affero General Public License | ||||
# along with this program. If not, see <http://www.gnu.org/licenses/>. | ||||
# | ||||
# This program is dual-licensed. If you wish to learn more about the | ||||
# RhodeCode Enterprise Edition, including its added features, Support services, | ||||
# and proprietary license terms, please see https://rhodecode.com/licenses/ | ||||
r4533 | import re | |||
r1 | import markdown | |||
r4533 | import xml.etree.ElementTree as etree | |||
r1 | ||||
r3683 | from markdown.extensions import Extension | |||
from markdown.extensions.fenced_code import FencedCodeExtension | ||||
from markdown.extensions.tables import TableExtension | ||||
r4533 | from markdown.inlinepatterns import Pattern | |||
r3683 | ||||
import gfm | ||||
r4533 | class InlineProcessor(Pattern): | |||
""" | ||||
Base class that inline patterns subclass. | ||||
This is the newer style inline processor that uses a more | ||||
efficient and flexible search approach. | ||||
""" | ||||
def __init__(self, pattern, md=None): | ||||
""" | ||||
Create an instant of an inline pattern. | ||||
Keyword arguments: | ||||
* pattern: A regular expression that matches a pattern | ||||
""" | ||||
self.pattern = pattern | ||||
self.compiled_re = re.compile(pattern, re.DOTALL | re.UNICODE) | ||||
# Api for Markdown to pass safe_mode into instance | ||||
self.safe_mode = False | ||||
self.md = md | ||||
def handleMatch(self, m, data): | ||||
"""Return a ElementTree element from the given match and the | ||||
start and end index of the matched text. | ||||
If `start` and/or `end` are returned as `None`, it will be | ||||
assumed that the processor did not find a valid region of text. | ||||
Subclasses should override this method. | ||||
Keyword arguments: | ||||
* m: A re match object containing a match of the pattern. | ||||
* data: The buffer current under analysis | ||||
Returns: | ||||
* el: The ElementTree element, text or None. | ||||
* start: The start of the region that has been matched or None. | ||||
* end: The end of the region that has been matched or None. | ||||
""" | ||||
pass # pragma: no cover | ||||
class SimpleTagInlineProcessor(InlineProcessor): | ||||
""" | ||||
Return element of type `tag` with a text attribute of group(2) | ||||
of a Pattern. | ||||
""" | ||||
def __init__(self, pattern, tag): | ||||
InlineProcessor.__init__(self, pattern) | ||||
self.tag = tag | ||||
def handleMatch(self, m, data): # pragma: no cover | ||||
el = etree.Element(self.tag) | ||||
el.text = m.group(2) | ||||
return el, m.start(0), m.end(0) | ||||
class SubstituteTagInlineProcessor(SimpleTagInlineProcessor): | ||||
""" Return an element of type `tag` with no children. """ | ||||
def handleMatch(self, m, data): | ||||
return etree.Element(self.tag), m.start(0), m.end(0) | ||||
class Nl2BrExtension(Extension): | ||||
BR_RE = r'\n' | ||||
def extendMarkdown(self, md, md_globals): | ||||
br_tag = SubstituteTagInlineProcessor(self.BR_RE, 'br') | ||||
md.inlinePatterns.add('nl', br_tag, '_end') | ||||
r3683 | class GithubFlavoredMarkdownExtension(Extension): | |||
""" | ||||
An extension that is as compatible as possible with GitHub-flavored | ||||
Markdown (GFM). | ||||
This extension aims to be compatible with the variant of GFM that GitHub | ||||
uses for Markdown-formatted gists and files (including READMEs). This | ||||
variant seems to have all the extensions described in the `GFM | ||||
documentation`_, except: | ||||
- Newlines in paragraphs are not transformed into ``br`` tags. | ||||
- Intra-GitHub links to commits, repositories, and issues are not | ||||
supported. | ||||
If you need support for features specific to GitHub comments and issues, | ||||
please use :class:`mdx_gfm.GithubFlavoredMarkdownExtension`. | ||||
.. _GFM documentation: https://guides.github.com/features/mastering-markdown/ | ||||
""" | ||||
def extendMarkdown(self, md, md_globals): | ||||
# Built-in extensions | ||||
r4533 | Nl2BrExtension().extendMarkdown(md, md_globals) | |||
r3683 | FencedCodeExtension().extendMarkdown(md, md_globals) | |||
TableExtension().extendMarkdown(md, md_globals) | ||||
# Custom extensions | ||||
gfm.AutolinkExtension().extendMarkdown(md, md_globals) | ||||
gfm.AutomailExtension().extendMarkdown(md, md_globals) | ||||
gfm.HiddenHiliteExtension([ | ||||
('guess_lang', 'False'), | ||||
('css_class', 'highlight') | ||||
]).extendMarkdown(md, md_globals) | ||||
gfm.SemiSaneListExtension().extendMarkdown(md, md_globals) | ||||
gfm.SpacedLinkExtension().extendMarkdown(md, md_globals) | ||||
gfm.StrikethroughExtension().extendMarkdown(md, md_globals) | ||||
gfm.TaskListExtension([ | ||||
('list_attrs', {'class': 'checkbox'}) | ||||
]).extendMarkdown(md, md_globals) | ||||
r1 | ||||
# Global Vars | ||||
URLIZE_RE = '(%s)' % '|'.join([ | ||||
r'<(?:f|ht)tps?://[^>]*>', | ||||
r'\b(?:f|ht)tps?://[^)<>\s]+[^.,)<>\s]', | ||||
r'\bwww\.[^)<>\s]+[^.,)<>\s]', | ||||
r'[^(<\s]+\.(?:com|net|org)\b', | ||||
]) | ||||
r317 | ||||
r1 | class UrlizePattern(markdown.inlinepatterns.Pattern): | |||
""" Return a link Element given an autolink (`http://example/com`). """ | ||||
def handleMatch(self, m): | ||||
url = m.group(2) | ||||
if url.startswith('<'): | ||||
url = url[1:-1] | ||||
text = url | ||||
if not url.split('://')[0] in ('http','https','ftp'): | ||||
if '@' in url and not '/' in url: | ||||
url = 'mailto:' + url | ||||
else: | ||||
url = 'http://' + url | ||||
el = markdown.util.etree.Element("a") | ||||
el.set('href', url) | ||||
el.text = markdown.util.AtomicString(text) | ||||
return el | ||||
class UrlizeExtension(markdown.Extension): | ||||
""" Urlize Extension for Python-Markdown. """ | ||||
def extendMarkdown(self, md, md_globals): | ||||
""" Replace autolink with UrlizePattern """ | ||||
md.inlinePatterns['autolink'] = UrlizePattern(URLIZE_RE, md) | ||||