minirst.py
831 lines
| 28.6 KiB
| text/x-python
|
PythonLexer
/ mercurial / minirst.py
Martin Geisler
|
r9156 | # minirst.py - minimal reStructuredText parser | ||
# | ||||
Martin Geisler
|
r10443 | # Copyright 2009, 2010 Matt Mackall <mpm@selenic.com> and others | ||
Martin Geisler
|
r9156 | # | ||
# This software may be used and distributed according to the terms of the | ||||
Matt Mackall
|
r10263 | # GNU General Public License version 2 or any later version. | ||
Martin Geisler
|
r9156 | |||
"""simplified reStructuredText parser. | ||||
This parser knows just enough about reStructuredText to parse the | ||||
Mercurial docstrings. | ||||
It cheats in a major way: nested blocks are not really nested. They | ||||
are just indented blocks that look like they are nested. This relies | ||||
on the user to keep the right indentation for the blocks. | ||||
Matt Mackall
|
r26421 | Remember to update https://mercurial-scm.org/wiki/HelpStyleGuide | ||
Martin Geisler
|
r12958 | when adding support for new constructs. | ||
Martin Geisler
|
r9156 | """ | ||
Gregory Szorc
|
r25960 | from __future__ import absolute_import | ||
Erik Zielke
|
r12388 | |||
Dan Villiom Podlaski Christiansen
|
r18750 | import cgi | ||
Gregory Szorc
|
r25960 | import re | ||
from .i18n import _ | ||||
from . import ( | ||||
encoding, | ||||
util, | ||||
) | ||||
Dan Villiom Podlaski Christiansen
|
r18750 | |||
Dan Villiom Podlaski Christiansen
|
def section(s):
    """Return ``s`` as a top-level title, underlined with double quotes."""
    underline = '"' * encoding.colwidth(s)
    return "%s\n%s\n\n" % (s, underline)
def subsection(s):
    """Return ``s`` as a second-level title, underlined with ``=``."""
    underline = '=' * encoding.colwidth(s)
    return "%s\n%s\n\n" % (s, underline)
def subsubsection(s):
    """Return ``s`` as a third-level title, underlined with ``-``."""
    underline = "-" * encoding.colwidth(s)
    return "%s\n%s\n\n" % (s, underline)
def subsubsubsection(s):
    """Return ``s`` as a fourth-level title, underlined with ``.``."""
    underline = "." * encoding.colwidth(s)
    return "%s\n%s\n\n" % (s, underline)
FUJIWARA Katsunori
|
def replace(text, substs):
    '''
    Apply a list of (find, replace) pairs to a text.

    >>> replace("foo bar", [('f', 'F'), ('b', 'B')])
    'Foo Bar'
    >>> encoding.encoding = 'latin1'
    >>> replace('\\x81\\\\', [('\\\\', '/')])
    '\\x81/'
    >>> encoding.encoding = 'shiftjis'
    >>> replace('\\x81\\\\', [('\\\\', '/')])
    '\\x81\\\\'
    '''
    # The substitution is done on the decoded (unicode) text: some
    # character encodings (cp932 for Japanese, at least) use ASCII
    # characters other than control/alphabet/digit as part of multi-byte
    # characters, so replacing directly on the locally-encoded string
    # could produce invalid byte sequences.
    charset = encoding.encoding
    decoded = text.decode(charset)
    for old, new in substs:
        decoded = decoded.replace(old.decode("ascii"), new.decode("ascii"))
    return decoded.encode(charset)
Martin Geisler
|
r12651 | |||
# A block separator: a newline followed by one or more blank
# (whitespace-only) lines.
_blockre = re.compile(r"\n(?:\s*\n)+")

def findblocks(text):
    """Split text into blocks of consecutive non-blank lines.

    Returns a list of dictionaries, one per block. Each dictionary has
    an 'indent' field (the smallest leading-whitespace count among the
    block's lines) and a 'lines' field (the lines with that common
    indentation removed).
    """
    blocks = []
    stripped = text.lstrip('\n').rstrip()
    for chunk in _blockre.split(stripped):
        lines = chunk.splitlines()
        if not lines:
            # happens when the (stripped) text is empty
            continue
        indent = min(len(line) - len(line.lstrip()) for line in lines)
        blocks.append({'indent': indent,
                       'lines': [line[indent:] for line in lines]})
    return blocks
def findliteralblocks(blocks):
    """Tag every block with a 'type' field, detecting literal blocks.

    Blocks that follow a paragraph ending in "::" and are indented
    deeper than it get the type 'literal'; every other block gets the
    type 'paragraph'. The "::" marker itself is removed or shortened.
    The list is modified in place and returned.
    """
    i = 0
    while i < len(blocks):
        # Searching for a block that looks like this:
        #
        # +------------------------------+
        # | paragraph                    |
        # | (ends with "::")             |
        # +------------------------------+
        #    +---------------------------+
        #    | indented literal block    |
        #    +---------------------------+
        blocks[i]['type'] = 'paragraph'
        lastline = blocks[i]['lines'][-1]
        if lastline.endswith('::') and i + 1 < len(blocks):
            indent = blocks[i]['indent']
            adjustment = blocks[i + 1]['indent'] - indent
            lines = blocks[i]['lines']

            if lines == ['::']:
                # Expanded form: remove block
                del blocks[i]
                i -= 1
            elif lastline.endswith(' ::'):
                # Partially minimized form: remove space and both
                # colons.
                lines[-1] = lastline[:-3]
            elif (len(lines) == 1 and
                  lines[0].lstrip(' ').startswith('.. ') and
                  lines[0].find(' ', 3) == -1):
                # directive on its own line, not a literal block
                i += 1
                continue
            else:
                # Fully minimized form: remove just one colon.
                lines[-1] = lastline[:-1]

            # List items are formatted with a hanging indent. We must
            # correct for this here while we still have the original
            # information on the indentation of the subsequent literal
            # blocks available. Note that blocks[i] is looked up again:
            # i may have been decremented above.
            m = _bulletre.match(blocks[i]['lines'][0])
            if m:
                indent += m.end()
                adjustment -= m.end()

            # Mark the following indented blocks.
            while i + 1 < len(blocks) and blocks[i + 1]['indent'] > indent:
                following = blocks[i + 1]
                following['type'] = 'literal'
                following['indent'] -= adjustment
                i += 1
        i += 1
    return blocks
Gregory Szorc
|
r31130 | _bulletre = re.compile(r'(\*|-|[0-9A-Za-z]+\.|\(?[0-9A-Za-z]+\)|\|) ') | ||
Erik Zielke
|
r13011 | _optionre = re.compile(r'^(-([a-zA-Z0-9]), )?(--[a-z0-9-]+)' | ||
r'((.*) +)(.*)$') | ||||
Martin Geisler
|
r10065 | _fieldre = re.compile(r':(?![: ])([^:]*)(?<! ):[ ]+(.*)') | ||
Martin Geisler
|
r9737 | _definitionre = re.compile(r'[^ ]') | ||
Matt Mackall
|
r15037 | _tablere = re.compile(r'(=+\s+)*=+') | ||
Martin Geisler
|
r9737 | |||
def splitparagraphs(blocks):
    """Split paragraphs that are really lists into one block per item.

    A paragraph whose first line looks like a list item is replaced, in
    place, by blocks typed 'bullet', 'option', 'field' or 'definition'
    that keep the paragraph's indentation. The list is returned.
    """
    # Tuples with (list type, item regexp, single line items?). Order
    # matters: definition lists has the least specific regexp and must
    # come last.
    listtypes = [('bullet', _bulletre, True),
                 ('option', _optionre, True),
                 ('field', _fieldre, True),
                 ('definition', _definitionre, False)]

    def match(lines, i, itemre, singleline):
        """Does itemre match an item at line i?

        A list item can be followed by an indented line or another list
        item (but only if singleline is True).
        """
        if not itemre.match(lines[i]):
            return False
        if i + 1 < len(lines):
            following = lines[i + 1] or ''
        else:
            following = ''
        if not singleline:
            return following.startswith(' ')
        return (following == '' or following[0] == ' ' or
                itemre.match(following))

    pos = 0
    while pos < len(blocks):
        if blocks[pos]['type'] == 'paragraph':
            lines = blocks[pos]['lines']
            for listtype, itemre, singleline in listtypes:
                if not match(lines, 0, itemre, singleline):
                    continue
                items = []
                for j, line in enumerate(lines):
                    if match(lines, j, itemre, singleline):
                        # a new item starts on this line
                        items.append({'type': listtype, 'lines': [],
                                      'indent': blocks[pos]['indent']})
                    items[-1]['lines'].append(line)
                blocks[pos:pos + 1] = items
                break
        pos += 1
    return blocks
Olav Reinert
|
r15861 | _fieldwidth = 14 | ||
Martin Geisler
|
r10065 | |||
def updatefieldlists(blocks):
    """Split the key off the first line of every field list item.

    Each 'field' block gets a 'key' entry and its first line is reduced
    to the text that follows the ":key:" marker. Blocks are updated in
    place and the list is returned.
    """
    for block in blocks:
        if block['type'] != 'field':
            continue
        key, rest = _fieldre.match(block['lines'][0]).groups()
        block['lines'][0] = rest
        block['key'] = key
    return blocks
Erik Zielke
|
def updateoptionlists(blocks):
    """Normalize option list items and align each run of them.

    For every 'option' block the first line is reduced to the
    description and an 'optstr' entry holds the rebuilt option text.
    All blocks of one consecutive run share the same 'optstrwidth', the
    display width of the widest 'optstr' in that run. Blocks are updated
    in place and the list is returned.
    """
    start = 0
    while start < len(blocks):
        if blocks[start]['type'] != 'option':
            start += 1
            continue

        widest = 0
        end = start
        while end < len(blocks) and blocks[end]['type'] == 'option':
            block = blocks[end]
            m = _optionre.match(block['lines'][0])
            shortoption = m.group(2)
            longoption = m.group(3)[2:].strip()
            desc = m.group(6).strip()
            longoptionarg = m.group(5).strip()
            block['lines'][0] = desc

            if shortoption:
                shortpart = "-%s " % shortoption
                noshortop = ''
            else:
                shortpart = ''
                # NOTE(review): padding that stands in for the missing
                # short option; its width may have been collapsed in
                # this listing - confirm against the canonical file.
                noshortop = ' '
            longpart = "%s--%s %s" % (noshortop, longoption, longoptionarg)
            opt = ("%s%s" % (shortpart, longpart)).rstrip()

            block['optstr'] = opt
            widest = max(widest, encoding.colwidth(opt))
            end += 1

        for block in blocks[start:end]:
            block['optstrwidth'] = widest
        # blocks[end] (if any) is not an option, so it can be skipped
        start = end + 1
    return blocks
Martin Geisler
|
def prunecontainers(blocks, keep):
    """Prune unwanted containers.

    The blocks must have a 'type' field, i.e., they should have been
    run through findliteralblocks first.

    A container whose dotted type shares no component with ``keep`` is
    removed together with the more deeply indented blocks that follow
    it. For a kept container only the ".. container::" line is removed
    and its contents are shifted left to the container's indentation.

    Returns a (blocks, pruned) pair where pruned lists the types of the
    containers that were removed. ``blocks`` is modified in place.
    """
    pruned = []
    pos = 0
    while pos + 1 < len(blocks):
        # Searching for a block that looks like this:
        #
        # +-------+---------------------------+
        # | ".. container ::" type            |
        # +---+                               |
        #     | blocks                        |
        #     +-------------------------------+
        head = blocks[pos]
        if (head['type'] == 'paragraph' and
            head['lines'][0].startswith('.. container::')):
            indent = head['indent']
            adjustment = blocks[pos + 1]['indent'] - indent
            containertype = head['lines'][0][15:]
            names = containertype.split('.')
            prune = not any(c in names for c in keep)
            if prune:
                pruned.append(containertype)

            # Always delete "..container:: type" block
            del blocks[pos]
            inner = pos
            # compensate for the increment at the bottom of the loop so
            # the block that moved into this slot is examined as well
            pos -= 1
            while inner < len(blocks) and blocks[inner]['indent'] > indent:
                if prune:
                    del blocks[inner]
                else:
                    blocks[inner]['indent'] -= adjustment
                    inner += 1
        pos += 1
    return blocks, pruned
Martin Geisler
|
r10443 | |||
Martin Geisler
|
r10984 | _sectionre = re.compile(r"""^([-=`:.'"~^_*+#])\1+$""") | ||
Matt Mackall
|
def findtables(blocks):
    '''Find simple tables

    Only simple one-line table elements are supported.

    A matching paragraph becomes a 'table' block: 'table' holds the rows
    as lists of stripped cell texts and 'header' tells whether a divider
    line was found between the borders. Blocks are updated in place and
    the list is returned.
    '''
    for block in blocks:
        # Searching for a block that looks like this:
        #
        # === ==== ===
        #  A    B   C
        # === ==== ===  <- optional
        #  1    2   3
        #  x    y   z
        # === ==== ===
        if not (block['type'] == 'paragraph' and
                len(block['lines']) > 2 and
                _tablere.match(block['lines'][0]) and
                block['lines'][0] == block['lines'][-1]):
            continue

        block['type'] = 'table'
        block['header'] = False
        div = block['lines'][0]

        # column markers are ASCII so we can calculate column
        # position in bytes
        columns = [x for x, ch in enumerate(div)
                   if ch == '=' and (x == 0 or div[x - 1] == ' ')]
        rows = []
        for line in block['lines'][1:-1]:
            if line == div:
                block['header'] = True
                continue
            row = []
            # we measure columns not in bytes or characters but in
            # colwidth which makes things tricky
            pos = columns[0] # leading whitespace is bytes
            for start, nextstart in zip(columns, columns[1:]):
                # gather the display columns belonging to this cell
                cell = encoding.getcols(line, pos, nextstart - start)
                pos += len(cell) # calculate byte position of end
                row.append(cell.strip())
            # the last column takes whatever is left on the line
            row.append(line[pos:].strip())
            rows.append(row)

        block['table'] = rows
    return blocks
Martin Geisler
|
def findsections(blocks):
    """Finds sections.

    The blocks must have a 'type' field, i.e., they should have been
    run through findliteralblocks first.

    A two-line paragraph whose second line is an underline as wide as
    the title becomes a 'section' block: the underline character is
    stored in 'underline' and the underline line is dropped.
    """
    for block in blocks:
        # Searching for a block that looks like this:
        #
        # +------------------------------+
        # | Section title                |
        # | -------------                |
        # +------------------------------+
        if block['type'] != 'paragraph' or len(block['lines']) != 2:
            continue
        title, underline = block['lines']
        if (encoding.colwidth(title) == len(underline) and
            _sectionre.match(underline)):
            block['underline'] = underline[0]
            block['type'] = 'section'
            del block['lines'][1]
    return blocks
Martin Geisler
|
def inlineliterals(blocks):
    """Replace the inline-literal marker (two back-quotes) with a double
    quote in paragraph and section blocks."""
    substs = [('``', '"')]
    for block in blocks:
        if block['type'] not in ('paragraph', 'section'):
            continue
        block['lines'] = [replace(line, substs) for line in block['lines']]
    return blocks
Martin Geisler
|
def hgrole(blocks):
    """Rewrite the :hg:`command` role in paragraph and section blocks."""
    substs = [(':hg:`', "'hg "), ('`', "'")]
    for block in blocks:
        if block['type'] not in ('paragraph', 'section'):
            continue
        # Turn :hg:`command` into "hg command". This also works
        # when there is a line break in the command and relies on
        # the fact that we have no stray back-quotes in the input
        # (run the blocks through inlineliterals first).
        block['lines'] = [replace(line, substs) for line in block['lines']]
    return blocks
Martin Geisler
|
def addmargins(blocks):
    """Adds empty blocks for vertical spacing.

    Consecutive bullet, option, and field blocks of the same type are
    kept together with no vertical space between them, nothing is
    inserted after a block that has no lines, and a 'margin' block is
    inserted between all other neighbours. The list is modified in
    place and returned.
    """
    grouped = ('bullet', 'option', 'field')
    pos = 1
    while pos < len(blocks):
        previous, current = blocks[pos - 1], blocks[pos]
        samelist = (current['type'] == previous['type'] and
                    current['type'] in grouped)
        # no lines in previous block, do not separate
        if samelist or not previous['lines']:
            pos += 1
            continue
        blocks.insert(pos, {'lines': [''], 'indent': 0, 'type': 'margin'})
        # step over the margin and the block that follows it
        pos += 2
    return blocks
Martin Geisler
|
def prunecomments(blocks):
    """Remove comments.

    A paragraph that starts with ".. " or consists of a lone ".." is
    deleted, together with the margin block directly after it (if any).
    The list is modified in place and returned.
    """
    pos = 0
    while pos < len(blocks):
        block = blocks[pos]
        iscomment = (block['type'] == 'paragraph' and
                     (block['lines'][0].startswith('.. ') or
                      block['lines'] == ['..']))
        if not iscomment:
            pos += 1
            continue
        del blocks[pos]
        if pos < len(blocks) and blocks[pos]['type'] == 'margin':
            del blocks[pos]
    return blocks
Gregory Szorc
|
r31131 | |||
_admonitions = set([ | ||||
'admonition', | ||||
'attention', | ||||
'caution', | ||||
'danger', | ||||
'error', | ||||
'hint', | ||||
'important', | ||||
'note', | ||||
'tip', | ||||
'warning', | ||||
]) | ||||
Martin Geisler
|
r12620 | |||
Gregory Szorc
|
def findadmonitions(blocks, admonitions=None):
    """
    Makes the type of the block an admonition block if
    the first line is an admonition directive

    ``admonitions`` is the collection of directive names to recognize
    (matched case-insensitively); the module default is used when it is
    empty or None. A matching block gets the type 'admonition' and an
    'admonitiontitle' entry holding the lower-cased directive name. The
    directive line is removed, and any text that followed the directive
    on it becomes the block's first line.
    """
    names = admonitions or _admonitions
    pattern = r'\.\. (%s)::' % '|'.join(sorted(names))
    directivere = re.compile(pattern, flags=re.IGNORECASE)

    for block in blocks:
        header = block['lines'][0]
        m = directivere.match(header)
        if not m:
            continue
        block['type'] = 'admonition'
        # strip the leading ".. " and the trailing "::"
        title = header[3:m.end() - 2].lower()
        firstline = header[m.end() + 1:]
        if firstline:
            block['lines'].insert(1, ' ' + firstline)

        block['admonitiontitle'] = title
        del block['lines'][0]
    return blocks
Martin Geisler
|
r9156 | |||
Martin Geisler
|
# Translated heading shown for each admonition type; looked up with the
# lower-cased directive name stored in a block's 'admonitiontitle'.
#
# 'admonition' (the generic directive) is listed because the default
# set of recognized admonitions includes it; without an entry here,
# formatting a ".. admonition::" block raises KeyError.
_admonitiontitles = {'admonition': _('Admonition:'),
                     'attention': _('Attention:'),
                     'caution': _('Caution:'),
                     'danger': _('!Danger!'),
                     'error': _('Error:'),
                     'hint': _('Hint:'),
                     'important': _('Important:'),
                     'note': _('Note:'),
                     'tip': _('Tip:'),
                     'warning': _('Warning!')}
Erik Zielke
|
def formatoption(block, width):
    """Format one option list item.

    The option string is padded to the block's 'optstrwidth' so that
    the descriptions of neighbouring options line up; the description
    is wrapped with util.wrap() using a width of ``width - 1``.
    """
    # NOTE(review): the whitespace inside the string literals below may
    # have been collapsed in this listing - confirm against the
    # canonical file.
    optstr = block['optstr']
    desc = ' '.join([line.strip() for line in block['lines']])
    padding = ' ' * (block['optstrwidth'] - encoding.colwidth(optstr))
    initindent = '%s%s ' % (optstr, padding)
    hangindent = ' ' * (encoding.colwidth(initindent) + 1)
    wrapped = util.wrap(desc, width - 1,
                        initindent=initindent,
                        hangindent=hangindent)
    return ' %s\n' % wrapped
Martin Geisler
|
def formatblock(block, width):
    """Format a block according to width.

    Returns the plain-text rendering of ``block`` (always ending in a
    newline). A non-positive ``width`` is replaced by 78.
    """
    if width <= 0:
        width = 78
    indent = ' ' * block['indent']
    btype = block['type']
    lines = block['lines']

    if btype == 'admonition':
        admonition = _admonitiontitles[block['admonitiontitle']]
        if not lines:
            return indent + admonition + '\n'
        # the body is indented like the last line of the admonition
        hang = len(lines[-1]) - len(lines[-1].lstrip())
        defindent = indent + hang * ' '
        text = ' '.join([line.strip() for line in lines])
        body = util.wrap(text, width=width,
                         initindent=defindent,
                         hangindent=defindent)
        return '%s\n%s\n' % (indent + admonition, body)

    if btype == 'margin':
        return '\n'

    if btype == 'literal':
        # NOTE(review): the extra indentation for literal blocks may
        # have been collapsed in this listing - confirm its width.
        indent += ' '
        return indent + ('\n' + indent).join(lines) + '\n'

    if btype == 'section':
        title = lines[0]
        underline = encoding.colwidth(title) * block['underline']
        return "%s%s\n%s%s\n" % (indent, title, indent, underline)

    if btype == 'table':
        table = block['table']
        # compute column widths
        widths = [max([encoding.colwidth(e) for e in c]) for c in zip(*table)]
        span = sum(widths) + len(widths) - 1
        indent = ' ' * block['indent']
        # wrapped text of the last column continues below that column
        hang = ' ' * (len(indent) + span - widths[-1])
        text = ''
        for row in table:
            cells = [v + ' ' * (w - encoding.colwidth(v))
                     for w, v in zip(widths, row)]
            rowtext = util.wrap(' '.join(cells), width=width,
                                initindent=indent, hangindent=hang)
            if not text and block['header']:
                # first row of a table with a header: add a rule below
                text = rowtext + '\n' + indent + '-' * (min(width, span)) + '\n'
            else:
                text += rowtext + "\n"
        return text

    if btype == 'definition':
        term = indent + lines[0]
        # the definition is indented like its last line
        hang = len(lines[-1]) - len(lines[-1].lstrip())
        defindent = indent + hang * ' '
        text = ' '.join([line.strip() for line in lines[1:]])
        body = util.wrap(text, width=width,
                         initindent=defindent,
                         hangindent=defindent)
        return '%s\n%s\n' % (term, body)

    subindent = indent
    if btype == 'bullet':
        if lines[0].startswith('| '):
            # Remove bullet for line blocks and add no extra
            # indentation. (This edits the block's own line list.)
            lines[0] = lines[0][2:]
        else:
            m = _bulletre.match(lines[0])
            subindent = indent + m.end() * ' '
    elif btype == 'field':
        key = block['key']
        subindent = indent + _fieldwidth * ' '
        if len(key) + 2 > _fieldwidth:
            # key too large, use full line width
            key = key.ljust(width)
        else:
            # key fits within field width
            key = key.ljust(_fieldwidth)
        lines[0] = key + lines[0]
    elif btype == 'option':
        return formatoption(block, width)

    text = ' '.join([line.strip() for line in lines])
    return util.wrap(text, width=width,
                     initindent=indent,
                     hangindent=subindent) + '\n'
Martin Geisler
|
r9156 | |||
Matt Mackall
|
def formathtml(blocks):
    """Format RST blocks as HTML

    ``blocks`` is a list of parsed block dictionaries ('type', 'indent',
    'lines' plus the type specific entries). Margin blocks are ignored.
    Returns the generated HTML as one string.
    """
    out = []
    headernest = ''
    listnest = []
    # block types that are rendered as items of an HTML list
    listtypes = ('definition', 'bullet', 'field', 'option')

    def escape(s):
        # Performs the same replacements as cgi.escape(s, True) without
        # relying on that function, which is deprecated and missing
        # from newer Python versions. '&' must be replaced first.
        s = s.replace('&', '&amp;')
        s = s.replace('<', '&lt;')
        s = s.replace('>', '&gt;')
        return s.replace('"', '&quot;')

    def joined(lines):
        # the lines of a block as one escaped, space separated string
        return escape(' '.join([line.strip() for line in lines]))

    def openlist(start, level):
        # open a new list unless one of the same kind is already open
        if not listnest or listnest[-1][0] != start:
            listnest.append((start, level))
            out.append('<%s>\n' % start)

    blocks = [b for b in blocks if b['type'] != 'margin']

    for pos, b in enumerate(blocks):
        btype = b['type']
        level = b['indent']
        lines = b['lines']

        if btype == 'admonition':
            admonition = escape(_admonitiontitles[b['admonitiontitle']])
            out.append('<p>\n<b>%s</b> %s\n</p>\n' % (admonition,
                                                      joined(lines)))
        elif btype == 'paragraph':
            out.append('<p>\n%s\n</p>\n' % escape('\n'.join(lines)))
        elif btype == 'literal':
            out.append('<pre>\n%s\n</pre>\n' % escape('\n'.join(lines)))
        elif btype == 'section':
            # the heading level is the order in which the underline
            # character was first seen
            underline = b['underline']
            if underline not in headernest:
                headernest += underline
            hlevel = headernest.index(underline) + 1
            out.append('<h%d>%s</h%d>\n' % (hlevel, escape(lines[0]), hlevel))
        elif btype == 'table':
            out.append('<table>\n')
            for row in b['table']:
                # cells are separated (not terminated) by a newline; an
                # empty row yields an empty <tr></tr> pair
                cells = '\n'.join(['<td>%s</td>' % escape(v) for v in row])
                out.append('<tr>%s</tr>\n' % cells)
            out.append('</table>\n')
        elif btype == 'definition':
            openlist('dl', level)
            term = escape(lines[0])
            out.append(' <dt>%s\n <dd>%s\n' % (term, joined(lines[1:])))
        elif btype == 'bullet':
            bullet, head = lines[0].split(' ', 1)
            if bullet in ('*', '-'):
                openlist('ul', level)
            else:
                openlist('ol', level)
            out.append(' <li> %s\n' % escape(' '.join([head] + lines[1:])))
        elif btype == 'field':
            openlist('dl', level)
            out.append(' <dt>%s\n <dd>%s\n' % (escape(b['key']),
                                               joined(lines)))
        elif btype == 'option':
            openlist('dl', level)
            out.append(' <dt>%s\n <dd>%s\n' % (escape(b['optstr']),
                                               joined(lines)))

        # close lists if indent level of next block is lower
        if listnest:
            start, listlevel = listnest[-1]
            if pos == len(blocks) - 1:
                closelist = True
            else:
                nextblock = blocks[pos + 1]
                nextindent = nextblock['indent']
                closelist = (nextindent < listlevel or
                             (nextindent == listlevel and
                              nextblock['type'] not in listtypes))
            # NOTE(review): at most one list is closed per block, so an
            # outer list may stay open when several are nested - confirm
            # whether that is intended.
            if closelist:
                out.append('</%s>\n' % start)
                listnest.pop()

    return ''.join(out)
Gregory Szorc
|
def parse(text, indent=0, keep=None, admonitions=None):
    """Parse text into a list of blocks

    ``indent`` is added to the indentation of every block, ``keep``
    lists the container types to keep (see prunecontainers) and
    ``admonitions`` the directive names to treat as admonitions (see
    findadmonitions). Returns a (blocks, pruned) pair where pruned is
    the list of container types that were removed.
    """
    blocks = findblocks(text)
    for block in blocks:
        block['indent'] += indent
    blocks = findliteralblocks(blocks)
    blocks = findtables(blocks)
    blocks, pruned = prunecontainers(blocks, keep or [])
    # the order of the passes matters: later passes rely on the types
    # assigned by the earlier ones
    for step in (findsections, inlineliterals, hgrole, splitparagraphs,
                 updatefieldlists, updateoptionlists):
        blocks = step(blocks)
    blocks = findadmonitions(blocks, admonitions=admonitions)
    blocks = addmargins(blocks)
    blocks = prunecomments(blocks)
    return blocks, pruned
Matt Mackall
|
def formatblocks(blocks, width):
    """Return the plain-text rendering of all blocks, concatenated."""
    rendered = [formatblock(block, width) for block in blocks]
    return ''.join(rendered)
Matt Mackall
|
def format(text, width=80, indent=0, keep=None, style='plain', section=None):
    """Parse and format the text according to width.

    With ``section`` set, only the sections of that name (and the
    sections nested below them) are rendered. ``style`` selects HTML
    output when it is 'html' and plain text otherwise. Returns the
    rendered text, or a (text, pruned) pair when ``keep`` is not None.
    """
    blocks, pruned = parse(text, indent, keep or [])
    if section:
        sections = getsections(blocks)
        blocks = []
        parents = []       # indices of the sections enclosing sections[idx]
        lastparents = []   # value of parents at the previous match
        synthetic = []     # positions of the parent headings added below
        collapse = True
        idx = 0
        while idx < len(sections):
            name, nest, secblocks = sections[idx]
            del parents[nest:]
            parents.append(idx)
            if name == section:
                if lastparents != parents:
                    llen = len(lastparents)
                    plen = len(parents)
                    if llen and llen != plen:
                        collapse = False
                    added = []
                    for depth in range(3, plen - 1):
                        parent = parents[depth]
                        if depth < llen and lastparents[depth] == parent:
                            # this parent was already emitted
                            continue
                        added.append(len(blocks))
                        parentblocks = sections[parent][2]
                        blocks.append(parentblocks[0])
                        blocks.append(parentblocks[-1])
                    if added:
                        synthetic.append(added)

                lastparents = parents[:]
                blocks.extend(secblocks)

                ## Also show all subnested sections
                while idx + 1 < len(sections) and sections[idx + 1][1] > nest:
                    idx += 1
                    blocks.extend(sections[idx][2])
            idx += 1

        if collapse:
            # work backwards so that deleting blocks does not shift the
            # positions recorded for the earlier groups
            for added in reversed(synthetic):
                path = [blocks[syn]['lines'][0] for syn in added]
                real = added[-1] + 2
                realline = blocks[real]['lines']
                dotted = '.'.join(path + [realline[0]]).replace('"', '')
                realline[0] = '"%s"' % dotted
                del blocks[added[0]:real]

    if style == 'html':
        text = formathtml(blocks)
    else:
        text = formatblocks(blocks, width)
    if keep is None:
        return text
    return text, pruned
Martin Geisler
|
r9156 | |||
Matt Mackall
|
def getsections(blocks):
    '''return a list of (section name, nesting level, blocks) tuples'''
    nest = ""
    level = 0
    secs = []

    def getname(b):
        # lower-cased key or first line, without surrounding double
        # quotes and without anything from the first "(" on
        if b['type'] == 'field':
            name = b['key']
        else:
            name = b['lines'][0]
        name = encoding.lower(name).strip('"')
        return name.partition('(')[0]

    def enter(nest, marker):
        # register marker in the nesting string (if it is new) and cut
        # the string back to it; returns (new nest, level of marker)
        if marker not in nest:
            nest += marker
        depth = nest.index(marker) + 1
        return nest[:depth], depth

    for b in blocks:
        btype = b['type']
        if btype == 'section':
            nest, level = enter(nest, b['underline'])
            secs.append((getname(b), level, [b]))
        elif btype in ('definition', 'field'):
            nest, level = enter(nest, ' ')
            # walk back through the sections to derive the level from
            # the indentation of an earlier definition
            for back in range(1, len(secs) + 1):
                sec = secs[-back]
                if sec[1] < level:
                    break
                siblings = [a for a in sec[2] if a['type'] == 'definition']
                if not siblings:
                    continue
                siblingindent = siblings[-1]['indent']
                indent = b['indent']
                if siblingindent < indent:
                    level += 1
                    break
                elif siblingindent == indent:
                    level = sec[1]
                    break
            secs.append((getname(b), level, [b]))
        else:
            if not secs:
                # add an initial empty section
                secs = [('', 0, [])]
            if btype != 'margin':
                pointer = 1
                bindent = b['indent']
                while pointer < len(secs):
                    section = secs[-pointer][2][0]
                    if section['type'] != 'margin':
                        sindent = section['indent']
                        if len(section['lines']) > 1:
                            second = section['lines'][1]
                            sindent += len(second) - len(second.lstrip(' '))
                        if bindent >= sindent:
                            break
                    pointer += 1
                if pointer > 1:
                    blevel = secs[-pointer][1]
                    if section['type'] != b['type']:
                        blevel += 1
                    secs.append(('', blevel, []))
            secs[-1][2].append(b)
    return secs
Martin Geisler
|
r9156 | |||
Matt Mackall
|
def decorateblocks(blocks, width):
    '''generate (section name, line text) pairs for search

    The result has one entry per section; each entry is the list of
    pairs for the lines (line endings kept) of that formatted section.
    '''
    decorated = []
    for sec in getsections(blocks):
        name = sec[0]
        text = formatblocks(sec[2], width)
        decorated.append([(name, line) for line in text.splitlines(True)])
    return decorated
Matt Mackall
|
r15039 | |||
def maketable(data, indent=0, header=False):
    '''Generate an RST table for the given table data as a list of lines

    ``data`` is a sequence of rows, each a sequence of cell strings.
    Every returned line ends with a newline and is prefixed with
    ``indent`` spaces. With ``header`` set (and more than one row), a
    divider is placed after the first row.
    '''
    widths = [max(encoding.colwidth(e) for e in c) for c in zip(*data)]
    margin = ' ' * indent
    div = margin + ' '.join('=' * w for w in widths) + '\n'

    out = [div]
    for row in data:
        cells = []
        for w, v in zip(widths, row):
            if '\n' in v:
                # only remove line breaks and indentation, long lines are
                # handled by the next tool
                v = ' '.join(e.lstrip() for e in v.split('\n'))
            cells.append(v + ' ' * (w - encoding.colwidth(v)))
        out.append(margin + ' '.join(cells) + "\n")

    if header and len(data) > 1:
        # index 2 is right after the top border and the first row
        out.insert(2, div)
    out.append(div)
    return out