upstream/ipython Commit - r17259:90f2049a

Fix mathjax pass-through with mistune

Thomas Kluyver -

r17259:90f2049a

parent child

IPython/nbconvert/filters/markdown.py

0 +20 -17

             """Markdown filters
             This file contains a collection of utility filters for dealing with
             markdown within Jinja templates.
             """
-            #-----------------------------------------------------------------------------
+            # Copyright (c) IPython Development Team.
-            # Copyright (c) 2013, the IPython Development Team.
             # Distributed under the terms of the Modified BSD License.
-            # The full license is in the file COPYING.txt, distributed with this software.
-            #-----------------------------------------------------------------------------
-            #-----------------------------------------------------------------------------
-            # Imports
-            #-----------------------------------------------------------------------------
             from __future__ import print_function
             # Stdlib imports
             import os
             import subprocess
             from io import TextIOWrapper, BytesIO
             import re
             import mistune
             from pygments import highlight
             from pygments.lexers import get_lexer_by_name
             from pygments.formatters import HtmlFormatter
             from pygments.util import ClassNotFound
             # IPython imports
             from IPython.nbconvert.utils.pandoc import pandoc
             from IPython.nbconvert.utils.exceptions import ConversionException
             from IPython.utils.process import get_output_error_code
             from IPython.utils.py3compat import cast_bytes
             from IPython.utils.version import check_version
-            #-----------------------------------------------------------------------------
-            # Functions
-            #-----------------------------------------------------------------------------
             # Path of the marked.js script, expected in the same directory as this module.
             marked = os.path.join(os.path.dirname(__file__), "marked.js")
             # Name of the node.js executable; stays None until _find_nodejs() resolves it.
             _node = None
             # Names exported as this module's public filters.
             __all__ = [
                 'markdown2html',
                 'markdown2html_pandoc',
                 'markdown2html_marked',
                 'markdown2html_mistune',
                 'markdown2latex',
                 'markdown2rst',
             ]
             class NodeJSMissing(ConversionException):
                 """Conversion error signalling that node.js could not be found or run."""
             def markdown2latex(source):
                 """Translate markdown text into LaTeX by delegating to pandoc.
                 pandoc must be installed, otherwise an error is raised; messages
                 emitted by pandoc itself go to stderr.
                 Parameters
                 ----------
                 source : string
                   Markdown text to convert; it is assumed to be valid markdown.
                 Returns
                 -------
                 out : string
                   The LaTeX text exactly as pandoc produced it.
                 """
                 latex = pandoc(source, 'markdown', 'latex')
                 return latex
             class MathBlockGrammar(mistune.BlockGrammar):
                 # Extra block-level patterns for display math ($$...$$) and for LaTeX
                 # \begin{name}...\end{name} environments.
                 # re.DOTALL makes "." match newlines, so a match may span several lines.
                 # NOTE(review): the block_math pattern is a non-raw string literal; "\$" is
                 # not a recognised string escape - consider an r"..." literal.
-                block_math = re.compile("^\$\$(.*?)\$\$")
+                block_math = re.compile("^\$\$(.*?)\$\$", re.DOTALL)
-                block_math2 = re.compile(r"^\\begin(.*?)\\end")
                 # Group 1 is the environment name (lowercase letters plus an optional
                 # trailing "*"), group 2 is the body; the \1 backreference requires the
                 # \end{...} to name the same environment as the \begin{...}.
+                latex_environment = re.compile(r"^\\begin\{([a-z]*\*?)\}(.*?)\\end\{\1\}",
+                                                            re.DOTALL)
             class MathBlockLexer(mistune.BlockLexer):
                 # Block lexer that adds math token types on top of mistune's block rules.
                 # The math rule names are listed ahead of mistune's defaults
                 # (presumably so they are tried first - confirm against mistune's BlockLexer).
-                default_features = ['block_math', 'block_math2'] + mistune.BlockLexer.default_features
+                default_features = ['block_math', 'latex_environment'] + mistune.BlockLexer.default_features
                 def __init__(self, rules=None, **kwargs):
                     # Fall back to the math-aware grammar when the caller supplies no rules.
                     if rules is None:
                         rules = MathBlockGrammar()
                     super(MathBlockLexer, self).__init__(rules, **kwargs)
                 def parse_block_math(self, m):
                     """Parse a $$math$$ block"""
                     # Only the text between the $$ delimiters (group 1) is stored.
                     self.tokens.append({
                         'type': 'block_math',
                         'text': m.group(1)
                     })
-                parse_block_math2 = parse_block_math
                 # Record a LaTeX environment as a token that keeps the environment name
                 # (group 1) and its body (group 2) separately.
+                def parse_latex_environment(self, m):
+                    self.tokens.append({
+                        'type': 'latex_environment',
+                        'name': m.group(1),
+                        'text': m.group(2)
+                    })
             class MathInlineGrammar(mistune.InlineGrammar):
                 """Inline grammar with an additional rule for ``$...$`` inline math."""
                 # Raw string literal: "\$" is not a valid string escape, so the non-raw
                 # form triggers an invalid-escape warning on newer Python versions.
                 # The compiled pattern is unchanged: a leading "$", a lazy non-empty
                 # body captured as group 1, then the first closing "$".
                 math = re.compile(r"^\$(.+?)\$")
             class MathInlineLexer(mistune.InlineLexer):
                 # Inline lexer that adds the 'math' rule ahead of mistune's inline rules.
                 default_features = ['math'] + mistune.InlineLexer.default_features
                 def __init__(self, renderer, rules=None, **kwargs):
                     # Fall back to the math-aware grammar when the caller supplies no rules.
                     if rules is None:
                         rules = MathInlineGrammar()
                     super(MathInlineLexer, self).__init__(renderer, rules, **kwargs)
                 def output_math(self, m):
                     # Hands the text between the $ delimiters (group 1) to the renderer.
                     # NOTE(review): the '+' line returns the renderer's result, whereas
                     # the '-' line discarded it and so returned None.
-                    self.renderer.inline_math(m.group(1))
+                    return self.renderer.inline_math(m.group(1))
             class MarkdownWithMath(mistune.Markdown):
                 # Markdown parser wired to the math-aware inline and block lexers.
                 def __init__(self, renderer, **kwargs):
                     # Install the math lexers unless the caller passed its own
                     # 'inline' / 'block' lexer.
                     if 'inline' not in kwargs:
                         kwargs['inline'] = MathInlineLexer(renderer, **kwargs)
                     # NOTE(review): by this point kwargs always contains 'inline', and
                     # it is forwarded to MathBlockLexer along with the other kwargs.
                     if 'block' not in kwargs:
                         kwargs['block'] = MathBlockLexer(**kwargs)
                     super(MarkdownWithMath, self).__init__(renderer, **kwargs)
                 def parse_block_math(self):
                     # Render the current 'block_math' token from its stored text.
                     return self.renderer.block_math(self.token['text'])
                 # Render the current 'latex_environment' token from its name and body.
+                def parse_latex_environment(self):
+                    return self.renderer.latex_environment(self.token['name'], self.token['text'])
             class IPythonRenderer(mistune.Renderer):
                 # Renderer that highlights code blocks with pygments and re-emits math
                 # with its original delimiters.
                 def block_code(self, code, lang):
                     # Render a code block: highlighted when pygments has a lexer for
                     # `lang`, otherwise as an HTML-escaped <pre><code> block.
                     if lang:
                         try:
                             lexer = get_lexer_by_name(lang, stripall=True)
                         except ClassNotFound:
                             # Unknown language name: treat it as the first line of the
                             # code and fall through to the plain rendering below.
                             code = lang + '\n' + code
                             lang = None
                     if not lang:
                         return '\n<pre><code>%s</code></pre>\n' % \
                             mistune.escape(code)
                     formatter = HtmlFormatter()
                     return highlight(code, lexer, formatter)
                 # Pass math through unaltered - mathjax does the rendering in the browser
                 def block_math(self, text):
                     # Re-wrap the text in the $$ delimiters removed by the lexer.
                     return '$$%s$$' % text
                 # Rebuild the \begin{name}...\end{name} wrapper around the body.
+                def latex_environment(self, name, text):
+                    return r'\begin{%s}%s\end{%s}' % (name, text, name)
                 def inline_math(self, text):
                     # Re-wrap the text in the single $ delimiters removed by the lexer.
                     return '$%s$' % text
             def markdown2html_mistune(source):
                 """Render a markdown string as HTML with the mistune-based parser."""
                 converter = MarkdownWithMath(renderer=IPythonRenderer())
                 return converter.render(source)
             def markdown2html_pandoc(source):
                 """Render a markdown string as HTML by calling pandoc with --mathjax."""
                 pandoc_args = ['--mathjax']
                 return pandoc(source, 'markdown', 'html', extra_args=pandoc_args)
             def _find_nodejs():
                 """Return the node.js command name, resolving it on the first call.
                 The result is stored in the module-level ``_node`` and reused afterwards.
                 'node' is returned as the fallback even when it was not verified.
                 """
                 global _node
                 if _node is not None:
                     # Already resolved by an earlier call.
                     return _node
                 # prefer md2html via marked if node.js >= 0.9.12 is available
                 # Debian names the executable 'nodejs', so that name is checked first.
                 _node = 'nodejs'
                 if _verify_node(_node):
                     return _node
                 _node = 'node'
                 return _node
             def markdown2html_marked(source, encoding='utf-8'):
                 """Render a markdown string as HTML by piping it through marked.js on node.
                 Parameters
                 ----------
                 source : string
                   Markdown text; passed through cast_bytes(source, encoding) before
                   being written to the subprocess' stdin.
                 encoding : string
                   Encoding used for the input bytes and for decoding the output.
                 Returns
                 -------
                 out : string
                   The subprocess' stdout, decoded with undecodable bytes replaced
                   and trailing newlines removed.
                 Raises
                 ------
                 NodeJSMissing
                   If starting the node process fails with an OSError.
                 """
                 argv = [_find_nodejs(), marked]
                 try:
                     proc = subprocess.Popen(
                         argv, stdin=subprocess.PIPE, stdout=subprocess.PIPE)
                 except OSError as e:
                     message = (
                         "The command '%s' returned an error: %s.\n" % (" ".join(argv), e) +
                         "Please check that Node.js is installed."
                     )
                     raise NodeJSMissing(message)
                 raw_html, _ = proc.communicate(cast_bytes(source, encoding))
                 # Decode via a text wrapper, replacing bytes that cannot be decoded.
                 reader = TextIOWrapper(BytesIO(raw_html), encoding, 'replace')
                 html = reader.read()
                 return html.rstrip('\n')
             # The mistune renderer is the default, because it's simple to depend on it.
             # markdown2html is therefore just another name for markdown2html_mistune.
             markdown2html = markdown2html_mistune
             def markdown2rst(source):
                 """Translate markdown text into reStructuredText by delegating to pandoc.
                 pandoc must be installed, otherwise an error is raised; messages
                 emitted by pandoc itself go to stderr.
                 Parameters
                 ----------
                 source : string
                   Markdown text to convert; it is assumed to be valid markdown.
                 Returns
                 -------
                 out : string
                   The ReST text exactly as pandoc produced it.
                 """
                 rst = pandoc(source, 'markdown', 'rst')
                 return rst
             def _verify_node(cmd):
                 """Check that ``cmd --version`` runs and reports at least version 0.9.12.
                 Parameters
                 ----------
                 cmd : string
                     Node command to verify (e.g. 'node').
                 Returns
                 -------
                 False when the command cannot be started (OSError) or exits with a
                 non-zero status; otherwise the result of check_version() on the
                 reported version with any leading 'v' removed.
                 """
                 try:
                     version_out, _err, status = get_output_error_code([cmd, '--version'])
                 except OSError:
                     # The executable could not be launched at all.
                     return False
                 if status:
                     # The executable ran but reported a failure.
                     return False
                 version = version_out.lstrip('v')
                 return check_version(version, '0.9.12')

IPython/nbconvert/filters/tests/test_markdown.py

0 +15 -18

+            """Tests for conversions from markdown to other formats"""
-            """
+            # Copyright (c) IPython Development Team.
-            Module with tests for Markdown
-            """
-            #-----------------------------------------------------------------------------
-            # Copyright (c) 2013, the IPython Development Team.
             # Distributed under the terms of the Modified BSD License.
-            # The full license is in the file COPYING.txt, distributed with this software.
-            #-----------------------------------------------------------------------------
-            #-----------------------------------------------------------------------------
-            # Imports
-            #-----------------------------------------------------------------------------
             from copy import copy
             from IPython.utils.py3compat import string_types
             from IPython.testing import decorators as dec
             from ...tests.base import TestsBase
             from ..markdown import markdown2latex, markdown2html, markdown2rst
-            #-----------------------------------------------------------------------------
-            # Class
-            #-----------------------------------------------------------------------------
             class TestMarkdown(TestsBase):
                 # Markdown inputs fed to each converter under test.
                 tests = [
                     '*test',
                     '**test',
                     '*test*',
                     '_test_',
                     '__test__',
                     '__*test*__',
                     '**test**',
                     '#test',
                     '##test',
                     'test\n----',
                     'test [link](https://google.com/)']
                 # Expected substring(s) of the output for the input at the same index in
                 # `tests`; a tuple means every element must appear in the output.
                 tokens = [
                     '*test',
                     '**test',
                     'test',
                     'test',
                     'test',
                     'test',
                     'test',
                     'test',
                     'test',
                     'test',
                     ('test', 'https://google.com/')]
                 @dec.onlyif_cmds_exist('pandoc')
                 def test_markdown2latex(self):
                     """markdown2latex test"""
                     for index, test in enumerate(self.tests):
                         self._try_markdown(markdown2latex, test, self.tokens[index])
                 def test_markdown2html(self):
                     """markdown2html test"""
                     for index, test in enumerate(self.tests):
                         self._try_markdown(markdown2html, test, self.tokens[index])
+                def test_markdown2html_math(self):
+                    # Mathematical expressions should be passed through unaltered
+                    cases = [("\\begin{equation*}\n"
+                              "\\left( \\sum_{k=1}^n a_k b_k \\right)^2 \\leq \\left( \\sum_{k=1}^n a_k^2 \\right) \\left( \\sum_{k=1}^n b_k^2 \\right)\n"
+                              "\\end{equation*}"),
+                             ("$$\n"
+                              "a = 1 *3* 5\n"
+                              "$$"),
+                              "$ a = 1 *3* 5 $",
+                            ]
+                    for case in cases:
+                        self.assertIn(case, markdown2html(case))
                 @dec.onlyif_cmds_exist('pandoc')
                 def test_markdown2rst(self):
                     """markdown2rst test"""
                     # Modify a copy of the token array for rst: escape the asterisks
                     tokens = copy(self.tokens)
                     tokens[0] = r'\*test'
                     tokens[1] = r'\*\*test'
                     for index, test in enumerate(self.tests):
                         self._try_markdown(markdown2rst, test, tokens[index])
                 def _try_markdown(self, method, test, tokens):
                     # Convert `test` with `method` and check that the expected token(s)
                     # occur in the result. `tokens` is either one string or an iterable
                     # of strings that must all be present.
                     results = method(test)
                     if isinstance(tokens, string_types):
                         assert tokens in results
                     else:
                         for token in tokens:
                             assert token in results

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages