upstream/mercurial-mirror Commit - r9738:f52c4f7a

1

# minirst.py - minimal reStructuredText parser

1

# minirst.py - minimal reStructuredText parser

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2, incorporated herein by reference.

6

# GNU General Public License version 2, incorporated herein by reference.

7

8

"""simplified reStructuredText parser.

8

"""simplified reStructuredText parser.

9

10

This parser knows just enough about reStructuredText to parse the

10

This parser knows just enough about reStructuredText to parse the

11

Mercurial docstrings.

11

Mercurial docstrings.

12

13

It cheats in a major way: nested blocks are not really nested. They

13

It cheats in a major way: nested blocks are not really nested. They

14

are just indented blocks that look like they are nested. This relies

14

are just indented blocks that look like they are nested. This relies

15

on the user to keep the right indentation for the blocks.

15

on the user to keep the right indentation for the blocks.

16

17

It only supports a small subset of reStructuredText:

17

It only supports a small subset of reStructuredText:

18

19

- paragraphs

19

- paragraphs

20

21

- definition lists (must use ' ' to indent definitions)

21

- definition lists (must use ' ' to indent definitions)

22

23

- lists (items must start with '-')

23

- lists (items must start with '-')

24

25

- field lists (colons cannot be escaped)

25

- field lists (colons cannot be escaped)

26

27

- literal blocks

27

- literal blocks

28

29

- option lists (supports only long options without arguments)

29

- option lists (supports only long options without arguments)

30

31

- inline markup is not recognized at all.

31

- inline markup is not recognized at all.

32

"""

32

"""

33

34

import re, sys, textwrap

34

import re, sys, textwrap

35

36

37

def findblocks(text):

37

def findblocks(text):

38

"""Find continuous blocks of lines in text.

38

"""Find continuous blocks of lines in text.

39

40

Returns a list of dictionaries representing the blocks. Each block

40

Returns a list of dictionaries representing the blocks. Each block

41

has an 'indent' field and a 'lines' field.

41

has an 'indent' field and a 'lines' field.

42

"""

42

"""

43

blocks = [[]]

43

blocks = [[]]

44

lines = text.splitlines()

44

lines = text.splitlines()

45

for line in lines:

45

for line in lines:

46

if line.strip():

46

if line.strip():

47

blocks[-1].append(line)

47

blocks[-1].append(line)

48

elif blocks[-1]:

48

elif blocks[-1]:

49

blocks.append([])

49

blocks.append([])

50

if not blocks[-1]:

50

if not blocks[-1]:

51

del blocks[-1]

51

del blocks[-1]

52

53

for i, block in enumerate(blocks):

53

for i, block in enumerate(blocks):

54

indent = min((len(l) - len(l.lstrip())) for l in block)

54

indent = min((len(l) - len(l.lstrip())) for l in block)

55

blocks[i] = dict(indent=indent, lines=[l[indent:] for l in block])

55

blocks[i] = dict(indent=indent, lines=[l[indent:] for l in block])

56

return blocks

56

return blocks

57

58

59

def findliteralblocks(blocks):

59

def findliteralblocks(blocks):

60

"""Finds literal blocks and adds a 'type' field to the blocks.

60

"""Finds literal blocks and adds a 'type' field to the blocks.

61

62

Literal blocks are given the type 'literal', all other blocks are

62

Literal blocks are given the type 'literal', all other blocks are

63

given type the 'paragraph'.

63

given type the 'paragraph'.

64

"""

64

"""

65

i = 0

65

i = 0

66

while i < len(blocks):

66

while i < len(blocks):

67

# Searching for a block that looks like this:

67

# Searching for a block that looks like this:

68

#

68

#

69

# +------------------------------+

69

# +------------------------------+

70

# | paragraph |

70

# | paragraph |

71

# | (ends with "::") |

71

# | (ends with "::") |

72

# +------------------------------+

72

# +------------------------------+

73

# +---------------------------+

73

# +---------------------------+

74

# | indented literal block |

74

# | indented literal block |

75

# +---------------------------+

75

# +---------------------------+

76

blocks[i]['type'] = 'paragraph'

76

blocks[i]['type'] = 'paragraph'

77

if blocks[i]['lines'][-1].endswith('::') and i+1 < len(blocks):

77

if blocks[i]['lines'][-1].endswith('::') and i+1 < len(blocks):

78

indent = blocks[i]['indent']

78

indent = blocks[i]['indent']

79

adjustment = blocks[i+1]['indent'] - indent

79

adjustment = blocks[i+1]['indent'] - indent

80

81

if blocks[i]['lines'] == ['::']:

81

if blocks[i]['lines'] == ['::']:

82

# Expanded form: remove block

82

# Expanded form: remove block

83

del blocks[i]

83

del blocks[i]

84

i -= 1

84

i -= 1

85

elif blocks[i]['lines'][-1].endswith(' ::'):

85

elif blocks[i]['lines'][-1].endswith(' ::'):

86

# Partially minimized form: remove space and both

86

# Partially minimized form: remove space and both

87

# colons.

87

# colons.

88

blocks[i]['lines'][-1] = blocks[i]['lines'][-1][:-3]

88

blocks[i]['lines'][-1] = blocks[i]['lines'][-1][:-3]

89

else:

89

else:

90

# Fully minimized form: remove just one colon.

90

# Fully minimized form: remove just one colon.

91

blocks[i]['lines'][-1] = blocks[i]['lines'][-1][:-1]

91

blocks[i]['lines'][-1] = blocks[i]['lines'][-1][:-1]

92

93

# List items are formatted with a hanging indent. We must

93

# List items are formatted with a hanging indent. We must

94

# correct for this here while we still have the original

94

# correct for this here while we still have the original

95

# information on the indentation of the subsequent literal

95

# information on the indentation of the subsequent literal

96

# blocks available.

96

# blocks available.

97

if blocks[i]['lines'][0].~~startswith~~(~~'- '~~):

97

m = _bulletre.match(blocks[i]['lines'][0])

98

~~indent~~ += 2

98

if m:

99

~~adjustm~~ent -= 2

99

indent += m.end()

100

adjustment -= m.end()

100

101

# Mark the following indented blocks.

102

# Mark the following indented blocks.

102

while i+1 < len(blocks) and blocks[i+1]['indent'] > indent:

103

while i+1 < len(blocks) and blocks[i+1]['indent'] > indent:

103

blocks[i+1]['type'] = 'literal'

104

blocks[i+1]['type'] = 'literal'

104

blocks[i+1]['indent'] -= adjustment

105

blocks[i+1]['indent'] -= adjustment

105

i += 1

106

i += 1

106

i += 1

107

i += 1

107

return blocks

108

return blocks

108

109

_bulletre = re.compile(r'- ')

110

_bulletre = re.compile(r'- ')

110

_optionre = re.compile(r'^(--[a-z-]+)((?:[ =][a-zA-Z][\w-]*)? +)(.*)$')

111

_optionre = re.compile(r'^(--[a-z-]+)((?:[ =][a-zA-Z][\w-]*)? +)(.*)$')

111

_fieldre = re.compile(r':(?![: ])([^:]*)(?<! ):( +)(.*)')

112

_fieldre = re.compile(r':(?![: ])([^:]*)(?<! ):( +)(.*)')

112

_definitionre = re.compile(r'[^ ]')

113

_definitionre = re.compile(r'[^ ]')

113

114

def splitparagraphs(blocks):

115

def splitparagraphs(blocks):

115

"""Split paragraphs into lists."""

116

"""Split paragraphs into lists."""

116

# Tuples with (list type, item regexp, single line items?). Order

117

# Tuples with (list type, item regexp, single line items?). Order

117

# matters: definition lists has the least specific regexp and must

118

# matters: definition lists has the least specific regexp and must

118

# come last.

119

# come last.

119

listtypes = [('bullet', _bulletre, True),

120

listtypes = [('bullet', _bulletre, True),

120

('option', _optionre, True),

121

('option', _optionre, True),

121

('field', _fieldre, True),

122

('field', _fieldre, True),

122

('definition', _definitionre, False)]

123

('definition', _definitionre, False)]

123

124

def match(lines, i, itemre, singleline):

125

def match(lines, i, itemre, singleline):

125

"""Does itemre match an item at line i?

126

"""Does itemre match an item at line i?

126

127

A list item can be followed by an idented line or another list

128

A list item can be followed by an idented line or another list

128

item (but only if singleline is True).

129

item (but only if singleline is True).

129

"""

130

"""

130

line1 = lines[i]

131

line1 = lines[i]

131

line2 = i+1 < len(lines) and lines[i+1] or ''

132

line2 = i+1 < len(lines) and lines[i+1] or ''

132

if not itemre.match(line1):

133

if not itemre.match(line1):

133

return False

134

return False

134

if singleline:

135

if singleline:

135

return line2 == '' or line2[0] == ' ' or itemre.match(line2)

136

return line2 == '' or line2[0] == ' ' or itemre.match(line2)

136

else:

137

else:

137

return line2.startswith(' ')

138

return line2.startswith(' ')

138

139

i = 0

140

i = 0

140

while i < len(blocks):

141

while i < len(blocks):

141

if blocks[i]['type'] == 'paragraph':

142

if blocks[i]['type'] == 'paragraph':

142

lines = blocks[i]['lines']

143

lines = blocks[i]['lines']

143

for type, itemre, singleline in listtypes:

144

for type, itemre, singleline in listtypes:

144

if match(lines, 0, itemre, singleline):

145

if match(lines, 0, itemre, singleline):

145

items = []

146

items = []

146

for j, line in enumerate(lines):

147

for j, line in enumerate(lines):

147

if match(lines, j, itemre, singleline):

148

if match(lines, j, itemre, singleline):

148

items.append(dict(type=type, lines=[],

149

items.append(dict(type=type, lines=[],

149

indent=blocks[i]['indent']))

150

indent=blocks[i]['indent']))

150

items[-1]['lines'].append(line)

151

items[-1]['lines'].append(line)

151

blocks[i:i+1] = items

152

blocks[i:i+1] = items

152

break

153

break

153

i += 1

154

i += 1

154

return blocks

155

return blocks

155

156

157

def findsections(blocks):

158

def findsections(blocks):

158

"""Finds sections.

159

"""Finds sections.

159

160

The blocks must have a 'type' field, i.e., they should have been

161

The blocks must have a 'type' field, i.e., they should have been

161

run through findliteralblocks first.

162

run through findliteralblocks first.

162

"""

163

"""

163

for block in blocks:

164

for block in blocks:

164

# Searching for a block that looks like this:

165

# Searching for a block that looks like this:

165

#

166

#

166

# +------------------------------+

167

# +------------------------------+

167

# | Section title |

168

# | Section title |

168

# | ------------- |

169

# | ------------- |

169

# +------------------------------+

170

# +------------------------------+

170

if (block['type'] == 'paragraph' and

171

if (block['type'] == 'paragraph' and

171

len(block['lines']) == 2 and

172

len(block['lines']) == 2 and

172

block['lines'][1] == '-' * len(block['lines'][0])):

173

block['lines'][1] == '-' * len(block['lines'][0])):

173

block['type'] = 'section'

174

block['type'] = 'section'

174

return blocks

175

return blocks

175

176

177

def inlineliterals(blocks):

178

def inlineliterals(blocks):

178

for b in blocks:

179

for b in blocks:

179

if b['type'] == 'paragraph':

180

if b['type'] == 'paragraph':

180

b['lines'] = [l.replace('``', '"') for l in b['lines']]

181

b['lines'] = [l.replace('``', '"') for l in b['lines']]

181

return blocks

182

return blocks

182

183

184

def addmargins(blocks):

185

def addmargins(blocks):

185

"""Adds empty blocks for vertical spacing.

186

"""Adds empty blocks for vertical spacing.

186

187

This groups bullets, options, and definitions together with no vertical

188

This groups bullets, options, and definitions together with no vertical

188

space between them, and adds an empty block between all other blocks.

189

space between them, and adds an empty block between all other blocks.

189

"""

190

"""

190

i = 1

191

i = 1

191

while i < len(blocks):

192

while i < len(blocks):

192

if (blocks[i]['type'] == blocks[i-1]['type'] and

193

if (blocks[i]['type'] == blocks[i-1]['type'] and

193

blocks[i]['type'] in ('bullet', 'option', 'field', 'definition')):

194

blocks[i]['type'] in ('bullet', 'option', 'field', 'definition')):

194

i += 1

195

i += 1

195

else:

196

else:

196

blocks.insert(i, dict(lines=[''], indent=0, type='margin'))

197

blocks.insert(i, dict(lines=[''], indent=0, type='margin'))

197

i += 2

198

i += 2

198

return blocks

199

return blocks

199

200

201

def formatblock(block, width):

202

def formatblock(block, width):

202

"""Format a block according to width."""

203

"""Format a block according to width."""

203

if width <= 0:

204

if width <= 0:

204

width = 78

205

width = 78

205

indent = ' ' * block['indent']

206

indent = ' ' * block['indent']

206

if block['type'] == 'margin':

207

if block['type'] == 'margin':

207

return ''

208

return ''

208

if block['type'] == 'literal':

209

if block['type'] == 'literal':

209

indent += ' '

210

indent += ' '

210

return indent + ('\n' + indent).join(block['lines'])

211

return indent + ('\n' + indent).join(block['lines'])

211

if block['type'] == 'section':

212

if block['type'] == 'section':

212

return indent + ('\n' + indent).join(block['lines'])

213

return indent + ('\n' + indent).join(block['lines'])

213

if block['type'] == 'definition':

214

if block['type'] == 'definition':

214

term = indent + block['lines'][0]

215

term = indent + block['lines'][0]

215

hang = len(block['lines'][-1]) - len(block['lines'][-1].lstrip())

216

hang = len(block['lines'][-1]) - len(block['lines'][-1].lstrip())

216

defindent = indent + hang * ' '

217

defindent = indent + hang * ' '

217

text = ' '.join(map(str.strip, block['lines'][1:]))

218

text = ' '.join(map(str.strip, block['lines'][1:]))

218

return "%s\n%s" % (term, textwrap.fill(text, width=width,

219

return "%s\n%s" % (term, textwrap.fill(text, width=width,

219

initial_indent=defindent,

220

initial_indent=defindent,

220

subsequent_indent=defindent))

221

subsequent_indent=defindent))

221

initindent = subindent = indent

222

initindent = subindent = indent

222

if block['type'] == 'bullet':

223

if block['type'] == 'bullet':

223

subindent = indent + ' '

224

m = _bulletre.match(block['lines'][0])

225

if m:

226

subindent = indent + m.end() * ' '

224

elif block['type'] == 'field':

227

elif block['type'] == 'field':

225

m = _fieldre.match(block['lines'][0])

228

m = _fieldre.match(block['lines'][0])

226

if m:

229

if m:

227

key, spaces, rest = m.groups()

230

key, spaces, rest = m.groups()

228

# Turn ":foo: bar" into "foo bar".

231

# Turn ":foo: bar" into "foo bar".

229

block['lines'][0] = '%s %s%s' % (key, spaces, rest)

232

block['lines'][0] = '%s %s%s' % (key, spaces, rest)

230

subindent = indent + (2 + len(key) + len(spaces)) * ' '

233

subindent = indent + (2 + len(key) + len(spaces)) * ' '

231

elif block['type'] == 'option':

234

elif block['type'] == 'option':

232

m = _optionre.match(block['lines'][0])

235

m = _optionre.match(block['lines'][0])

233

if m:

236

if m:

234

option, arg, rest = m.groups()

237

option, arg, rest = m.groups()

235

subindent = indent + (len(option) + len(arg)) * ' '

238

subindent = indent + (len(option) + len(arg)) * ' '

236

239

237

text = ' '.join(map(str.strip, block['lines']))

240

text = ' '.join(map(str.strip, block['lines']))

238

return textwrap.fill(text, width=width,

241

return textwrap.fill(text, width=width,

239

initial_indent=initindent,

242

initial_indent=initindent,

240

subsequent_indent=subindent)

243

subsequent_indent=subindent)

241

244

242

245

243

def format(text, width, indent=0):

246

def format(text, width, indent=0):

244

"""Parse and format the text according to width."""

247

"""Parse and format the text according to width."""

245

blocks = findblocks(text)

248

blocks = findblocks(text)

246

for b in blocks:

249

for b in blocks:

247

b['indent'] += indent

250

b['indent'] += indent

248

blocks = findliteralblocks(blocks)

251

blocks = findliteralblocks(blocks)

249

blocks = inlineliterals(blocks)

252

blocks = inlineliterals(blocks)

250

blocks = splitparagraphs(blocks)

253

blocks = splitparagraphs(blocks)

251

blocks = findsections(blocks)

254

blocks = findsections(blocks)

252

blocks = addmargins(blocks)

255

blocks = addmargins(blocks)

253

return '\n'.join(formatblock(b, width) for b in blocks)

256

return '\n'.join(formatblock(b, width) for b in blocks)

254

257

255

258

256

if __name__ == "__main__":

259

if __name__ == "__main__":

257

from pprint import pprint

260

from pprint import pprint

258

261

259

def debug(func, blocks):

262

def debug(func, blocks):

260

blocks = func(blocks)

263

blocks = func(blocks)

261

print "*** after %s:" % func.__name__

264

print "*** after %s:" % func.__name__

262

pprint(blocks)

265

pprint(blocks)

263

print

266

print

264

return blocks

267

return blocks

265

268

266

text = open(sys.argv[1]).read()

269

text = open(sys.argv[1]).read()

267

blocks = debug(findblocks, text)

270

blocks = debug(findblocks, text)

268

blocks = debug(findliteralblocks, blocks)

271

blocks = debug(findliteralblocks, blocks)

269

blocks = debug(splitparagraphs, blocks)

272

blocks = debug(splitparagraphs, blocks)

270

blocks = debug(findsections, blocks)

273

blocks = debug(findsections, blocks)

271

blocks = debug(addmargins, blocks)

274

blocks = debug(addmargins, blocks)

272

print '\n'.join(formatblock(b, 30) for b in blocks)

275

print '\n'.join(formatblock(b, 30) for b in blocks)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # minirst.py - minimal reStructuredText parser
             #
             # Copyright 2009 Matt Mackall <mpm@selenic.com> and others
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2, incorporated herein by reference.
             """simplified reStructuredText parser.
             This parser knows just enough about reStructuredText to parse the
             Mercurial docstrings.
             It cheats in a major way: nested blocks are not really nested. They
             are just indented blocks that look like they are nested. This relies
             on the user to keep the right indentation for the blocks.
             It only supports a small subset of reStructuredText:
             - paragraphs
             - definition lists (must use '  ' to indent definitions)
             - lists (items must start with '-')
             - field lists (colons cannot be escaped)
             - literal blocks
             - option lists (supports only long options, optionally followed by
               an argument)
             - inline markup is not recognized at all.
             """
             import re, sys, textwrap
             def findblocks(text):
                 """Split text into blocks of consecutive non-blank lines.

                 Lines that are empty or contain only whitespace separate the
                 blocks and are dropped. The result is a list of dictionaries,
                 one per block, each with two fields:

                 - 'indent': the smallest number of leading whitespace characters
                   found on any line of the block
                 - 'lines': the lines of the block with that common indentation
                   removed
                 """
                 groups = []
                 current = []
                 for line in text.splitlines():
                     if line.strip():
                         current.append(line)
                     elif current:
                         # A blank line closes the block collected so far; runs
                         # of blank lines never produce empty blocks.
                         groups.append(current)
                         current = []
                 if current:
                     groups.append(current)

                 result = []
                 for group in groups:
                     margin = min(len(l) - len(l.lstrip()) for l in group)
                     result.append({'indent': margin,
                                    'lines': [l[margin:] for l in group]})
                 return result
             def findliteralblocks(blocks):
                 """Finds literal blocks and adds a 'type' field to the blocks.

                 Literal blocks are given the type 'literal', all other blocks are
                 given the type 'paragraph'.

                 A paragraph whose last line ends with "::" introduces literal
                 blocks: every following block indented deeper than that
                 paragraph is marked as literal and has its 'indent' reduced by
                 the difference between the first following block's indent and
                 the paragraph's indent. The "::" marker itself is removed or
                 shortened depending on how it was written. The list is modified
                 in place and returned.
                 """
                 i = 0
                 while i < len(blocks):
                     # Searching for a block that looks like this:
                     #
                     # +------------------------------+
                     # | paragraph                    |
                     # | (ends with "::")             |
                     # +------------------------------+
                     #    +---------------------------+
                     #    | indented literal block    |
                     #    +---------------------------+
                     blocks[i]['type'] = 'paragraph'
                     if blocks[i]['lines'][-1].endswith('::') and i+1 < len(blocks):
                         # Remember the paragraph's indent and how much deeper the
                         # next block sits before the paragraph is altered below.
                         indent = blocks[i]['indent']
                         adjustment = blocks[i+1]['indent'] - indent
                         if blocks[i]['lines'] == ['::']:
                             # Expanded form: remove block
                             # NOTE(review): when the removed block was the first
                             # one, i becomes -1 here, so the blocks[i] lookup
                             # below reads the *last* block in the list.
                             del blocks[i]
                             i -= 1
                         elif blocks[i]['lines'][-1].endswith(' ::'):
                             # Partially minimized form: remove space and both
                             # colons.
                             blocks[i]['lines'][-1] = blocks[i]['lines'][-1][:-3]
                         else:
                             # Fully minimized form: remove just one colon.
                             blocks[i]['lines'][-1] = blocks[i]['lines'][-1][:-1]
                         # List items are formatted with a hanging indent. We must
                         # correct for this here while we still have the original
                         # information on the indentation of the subsequent literal
                         # blocks available.
                         # NOTE(review): the lines marked '-'/'+' below appear to be
                         # the removed/added sides of the changeset shown on this
                         # page; the '+' side derives the hanging indent from the
                         # length of the _bulletre match instead of a fixed 2.
-                        if blocks[i]['lines'][0].startswith('- '):
+                        m = _bulletre.match(blocks[i]['lines'][0])
-                            indent += 2
+                        if m:
-                            adjustment -= 2
+                            indent += m.end()
+                            adjustment -= m.end()
                         # Mark the following indented blocks.
                         while i+1 < len(blocks) and blocks[i+1]['indent'] > indent:
                             blocks[i+1]['type'] = 'literal'
                             blocks[i+1]['indent'] -= adjustment
                             i += 1
                     i += 1
                 return blocks
             # Item-start patterns for the list types handled by splitparagraphs and
             # formatblock. All of them are applied with .match(), i.e. anchored at
             # the beginning of a line.
             #
             # Bullet item: a dash followed by a single space.
             _bulletre = re.compile(r'- ')
             # Option item: group 1 is a long option ("--" plus lowercase letters and
             # dashes); group 2 is an optional argument introduced by a space or "="
             # together with the run of at least two spaces that separates it from
             # the description; group 3 is the description.
             _optionre = re.compile(r'^(--[a-z-]+)((?:[ =][a-zA-Z][\w-]*)?  +)(.*)$')
             # Field item ":key: text": group 1 is the key (no colons, not starting
             # with a colon or space, not ending with a space), group 2 the spaces
             # after the closing colon, group 3 the rest of the line.
             _fieldre = re.compile(r':(?![: ])([^:]*)(?<! ):( +)(.*)')
             # Definition term: any line whose first character is not a space.
             _definitionre = re.compile(r'[^ ]')
             def splitparagraphs(blocks):
                 """Break paragraph blocks that are lists into one block per item.

                 Each block of type 'paragraph' is checked against the known list
                 types. If its first line starts a list item, the block is replaced
                 in place by a sequence of blocks of that list type, all sharing
                 the indent of the original paragraph. Other blocks are left
                 alone. The (modified) list of blocks is returned.
                 """
                 # (list type, item regexp, may items be a single line?). The order
                 # is significant: the definition regexp is the least specific one
                 # and therefore has to be tried last.
                 candidates = (('bullet', _bulletre, True),
                               ('option', _optionre, True),
                               ('field', _fieldre, True),
                               ('definition', _definitionre, False))

                 def startsitem(lines, pos, itemre, singleline):
                     """Tell whether a list item matching itemre begins at lines[pos].

                     The line after an item must be indented. When singleline is
                     True the item may instead be the last line or be followed
                     directly by another item.
                     """
                     if not itemre.match(lines[pos]):
                         return False
                     following = ''
                     if pos + 1 < len(lines):
                         following = lines[pos + 1]
                     if not singleline:
                         return following.startswith(' ')
                     return (following == '' or following[0] == ' '
                             or itemre.match(following))

                 pos = 0
                 while pos < len(blocks):
                     current = blocks[pos]
                     if current['type'] == 'paragraph':
                         lines = current['lines']
                         for kind, itemre, singleline in candidates:
                             if not startsitem(lines, 0, itemre, singleline):
                                 continue
                             pieces = []
                             for n, line in enumerate(lines):
                                 if startsitem(lines, n, itemre, singleline):
                                     # A new item begins here; continuation lines
                                     # are appended to the most recent item.
                                     pieces.append({'type': kind, 'lines': [],
                                                    'indent': current['indent']})
                                 pieces[-1]['lines'].append(line)
                             blocks[pos:pos + 1] = pieces
                             break
                     pos += 1
                 return blocks
             def findsections(blocks):
                 """Mark section titles among the paragraph blocks.

                 Every block needs a 'type' field already, so findliteralblocks
                 has to run before this function. A paragraph counts as a section
                 when it looks like this:

                   +------------------------------+
                   | Section title                |
                   | -------------                |
                   +------------------------------+

                 i.e. it has exactly two lines and the second one consists of as
                 many dashes as the first line has characters. Such blocks get the
                 type 'section'. The list is modified in place and returned.
                 """
                 for candidate in blocks:
                     if candidate['type'] != 'paragraph':
                         continue
                     lines = candidate['lines']
                     if len(lines) != 2:
                         continue
                     title, underline = lines
                     if underline == '-' * len(title):
                         candidate['type'] = 'section'
                 return blocks
             def inlineliterals(blocks):
                 """Turn inline literal markers into plain double quotes.

                 In every block of type 'paragraph', each occurrence of two
                 backticks is replaced by a single '"'. Blocks of other types are
                 not touched. The list is modified in place and returned.
                 """
                 paragraphs = [blk for blk in blocks if blk['type'] == 'paragraph']
                 for para in paragraphs:
                     quoted = []
                     for line in para['lines']:
                         quoted.append(line.replace('``', '"'))
                     para['lines'] = quoted
                 return blocks
             def addmargins(blocks):
                 """Insert 'margin' blocks that provide vertical spacing.

                 Consecutive bullet, option, field, or definition blocks of the
                 same type are kept together without any space between them. In
                 every other case an empty block of type 'margin' is inserted
                 between two neighbouring blocks. The list is modified in place
                 and returned.
                 """
                 compact = ('bullet', 'option', 'field', 'definition')
                 pos = 1
                 while pos < len(blocks):
                     kind = blocks[pos]['type']
                     if kind == blocks[pos - 1]['type'] and kind in compact:
                         pos += 1
                         continue
                     blocks.insert(pos, {'lines': [''], 'indent': 0,
                                         'type': 'margin'})
                     # Step over both the new margin and the block it precedes.
                     pos += 2
                 return blocks
             def formatblock(block, width):
                 """Format a block according to width.

                 block is a dictionary with 'type', 'indent' and 'lines' fields;
                 width is the maximum line width passed to textwrap.fill, with
                 values <= 0 replaced by 78. Returns the formatted text as a
                 single string.

                 Margin blocks yield an empty string, literal and section blocks
                 are emitted line by line without wrapping, and all other block
                 types are re-wrapped. For field blocks the first line of the
                 block is rewritten in place.
                 """
                 if width <= 0:
                     width = 78
                 indent = ' ' * block['indent']
                 if block['type'] == 'margin':
                     return ''
                 if block['type'] == 'literal':
                     # Literal text is shown two columns deeper and never wrapped.
                     indent += '  '
                     return indent + ('\n' + indent).join(block['lines'])
                 if block['type'] == 'section':
                     return indent + ('\n' + indent).join(block['lines'])
                 if block['type'] == 'definition':
                     # The first line is the term; the remaining lines are joined
                     # and re-wrapped using the leading whitespace of the last
                     # line as the hanging indent.
                     term = indent + block['lines'][0]
                     hang = len(block['lines'][-1]) - len(block['lines'][-1].lstrip())
                     defindent = indent + hang * ' '
                     text = ' '.join(map(str.strip, block['lines'][1:]))
                     return "%s\n%s" % (term, textwrap.fill(text, width=width,
                                                            initial_indent=defindent,
                                                            subsequent_indent=defindent))
                 # Remaining types are wrapped as one paragraph; list items get a
                 # larger indent on continuation lines so the text lines up after
                 # the item marker.
                 initindent = subindent = indent
                 if block['type'] == 'bullet':
                     # NOTE(review): '-'/'+' lines appear to be the removed/added
                     # sides of the changeset shown on this page.
-                    subindent = indent + '  '
+                    m = _bulletre.match(block['lines'][0])
+                    if m:
+                        subindent = indent + m.end() * ' '
                 elif block['type'] == 'field':
                     m = _fieldre.match(block['lines'][0])
                     if m:
                         key, spaces, rest = m.groups()
                         # Turn ":foo: bar" into "foo   bar".
                         block['lines'][0] = '%s  %s%s' % (key, spaces, rest)
                         # The two removed colons are replaced by two spaces, so
                         # the text column stays where it was.
                         subindent = indent + (2 + len(key) + len(spaces)) * ' '
                 elif block['type'] == 'option':
                     m = _optionre.match(block['lines'][0])
                     if m:
                         option, arg, rest = m.groups()
                         # Continuation lines start where the description starts.
                         subindent = indent + (len(option) + len(arg)) * ' '
                 text = ' '.join(map(str.strip, block['lines']))
                 return textwrap.fill(text, width=width,
                                      initial_indent=initindent,
                                      subsequent_indent=subindent)
             def format(text, width, indent=0):
                 """Parse text as simplified reStructuredText and render it.

                 The text is split into blocks, every block is shifted right by
                 indent columns, the blocks are classified by the parsing passes
                 below, and each block is finally formatted for the given width.
                 The formatted blocks are joined with newlines and returned as one
                 string.
                 """
                 blocks = findblocks(text)
                 for blk in blocks:
                     blk['indent'] += indent
                 # The passes run in this fixed order; each takes the list of
                 # blocks and returns it.
                 passes = (findliteralblocks, inlineliterals, splitparagraphs,
                           findsections, addmargins)
                 for step in passes:
                     blocks = step(blocks)
                 rendered = [formatblock(blk, width) for blk in blocks]
                 return '\n'.join(rendered)
             if __name__ == "__main__":
                 from pprint import pprint
                 def debug(func, blocks):
                     blocks = func(blocks)
                     print "*** after %s:" % func.__name__
                     pprint(blocks)
                     print
                     return blocks
                 text = open(sys.argv[1]).read()
                 blocks = debug(findblocks, text)
                 blocks = debug(findliteralblocks, blocks)
                 blocks = debug(splitparagraphs, blocks)
                 blocks = debug(findsections, blocks)
                 blocks = debug(addmargins, blocks)
                 print '\n'.join(formatblock(b, 30) for b in blocks)