upstream/mercurial-mirror Commit - r39087:38409be2

1

# stringutil.py - utility for generic string formatting, parsing, etc.

1

# stringutil.py - utility for generic string formatting, parsing, etc.

2

#

2

#

3

4

5

6

#

6

#

7

# This software may be used and distributed according to the terms of the

7

# This software may be used and distributed according to the terms of the

8

# GNU General Public License version 2 or any later version.

8

# GNU General Public License version 2 or any later version.

9

10

from __future__ import absolute_import

10

from __future__ import absolute_import

11

12

import ast

12

import ast

13

import codecs

13

import codecs

14

import re as remod

14

import re as remod

15

import textwrap

15

import textwrap

16

17

from ..i18n import _

17

from ..i18n import _

18

from ..thirdparty import attr

18

from ..thirdparty import attr

19

20

from .. import (

20

from .. import (

21

encoding,

21

encoding,

22

error,

22

error,

23

pycompat,

23

pycompat,

24

)

24

)

25

26

# regex special chars pulled from https://bugs.python.org/issue29995
# which was part of Python 3.7.
_respecial = pycompat.bytestr(b'()[]{}?*+-|^$\\.&~# \t\n\r\v\f')
# Translation table for unicode.translate(): maps the code point of each
# special character to that character prefixed with a backslash.
_regexescapemap = {ord(i): (b'\\' + i).decode('latin1') for i in _respecial}

30

31

def reescape(pat):
    """Drop-in replacement for re.escape.

    Every character listed in ``_respecial`` is prefixed with a backslash.
    The return value has the same type as ``pat``: bytes in, bytes out;
    anything else is returned as translated by ``pat.translate()``.
    """
    # NOTE: it is intentional that this works on unicodes and not
    # bytes, as it's only possible to do the escaping with
    # unicode.translate, not bytes.translate. Sigh.
    wantuni = True
    if isinstance(pat, bytes):
        wantuni = False
        # latin1 maps every byte value to the code point of the same number,
        # so the decode/encode round trip below is lossless
        pat = pat.decode('latin1')
    pat = pat.translate(_regexescapemap)
    if wantuni:
        return pat
    return pat.encode('latin1')

44

45

def pprint(o, bprefix=False):
    """Pretty print an object.

    bytes are quoted after being passed through escapestr(), with a ``b``
    prefix when ``bprefix`` is true. bytearray, list, dict, set and tuple
    values are formatted recursively (``bprefix`` is propagated); dict items
    and set members are emitted in sorted order. Any other object is
    formatted with pycompat.byterepr().
    """
    if isinstance(o, bytes):
        if bprefix:
            return "b'%s'" % escapestr(o)
        return "'%s'" % escapestr(o)
    elif isinstance(o, bytearray):
        # codecs.escape_encode() can't handle bytearray, so escapestr fails
        # without coercion.
        return "bytearray['%s']" % escapestr(bytes(o))
    elif isinstance(o, list):
        return '[%s]' % (b', '.join(pprint(a, bprefix=bprefix) for a in o))
    elif isinstance(o, dict):
        return '{%s}' % (b', '.join(
            '%s: %s' % (pprint(k, bprefix=bprefix),
                        pprint(v, bprefix=bprefix))
            for k, v in sorted(o.items())))
    elif isinstance(o, set):
        return 'set([%s])' % (b', '.join(
            pprint(k, bprefix=bprefix) for k in sorted(o)))
    elif isinstance(o, tuple):
        return '(%s)' % (b', '.join(pprint(a, bprefix=bprefix) for a in o))
    else:
        return pycompat.byterepr(o)

69

70

def prettyrepr(o):
    """Pretty print a representation of a possibly-nested object

    The byterepr() of ``o`` is split in front of each ``<`` (or in front of
    the ``field=`` label that immediately precedes it), and each piece is
    placed on its own line, indented according to the number of ``<`` not
    yet closed by ``>`` at the start of that piece.
    """
    lines = []
    rs = pycompat.byterepr(o)
    p0 = p1 = 0
    while p0 < len(rs):
        # '... field=<type ... field=<type ...'
        #      ~~~~~~~~~~~~~~~~
        #      p0    p1        q0    q1
        q0 = -1
        q1 = rs.find('<', p1 + 1)
        if q1 < 0:
            # no further '<': the current piece runs to the end of the repr
            q1 = len(rs)
        elif q1 > p1 + 1 and rs.startswith('=', q1 - 1):
            # backtrack for ' field=<'
            q0 = rs.rfind(' ', p1 + 1, q1 - 1)
        if q0 < 0:
            q0 = q1
        else:
            q0 += 1  # skip ' '
        # nesting depth = '<' opened minus '>' closed before this piece
        l = rs.count('<', 0, p0) - rs.count('>', 0, p0)
        assert l >= 0
        lines.append((l, rs[p0:q0].rstrip()))
        p0, p1 = q0, q1
    # NOTE(review): the indent unit below is reproduced exactly as it appears
    # in the scraped text; that scrape collapsed runs of whitespace, so the
    # original literal may have been wider -- confirm against the repository.
    return '\n'.join(' ' * l + s for l, s in lines)

95

96

def buildrepr(r):
    """Format an optional printable representation from unexpanded bits

    ========  =================================
    type(r)   example
    ========  =================================
    tuple     ('<not %r>', other)
    bytes     '<branch closed>'
    callable  lambda: '<branch %r>' % sorted(b)
    object    other
    ========  =================================

    ``None`` yields an empty string. A tuple is treated as a format string
    followed by its arguments, bytes are returned unchanged, a callable is
    invoked with no arguments, and any other object is formatted by pprint().
    """
    if r is None:
        return ''
    elif isinstance(r, tuple):
        # r[0] is the format string; the remaining items are its arguments
        return r[0] % pycompat.rapply(pycompat.maybebytestr, r[1:])
    elif isinstance(r, bytes):
        return r
    elif callable(r):
        return r()
    else:
        return pprint(r)

118

119

def binary(s):
    """return true if a string is binary data

    A string counts as binary when it is non-empty and contains a NUL
    character; empty and ``None`` inputs yield False.
    """
    return bool(s and '\0' in s)

122

123

def stringmatcher(pattern, casesensitive=True):
    """
    accepts a string, possibly starting with 're:' or 'literal:' prefix.
    returns the matcher name, pattern, and matcher function.
    missing or unknown prefixes are treated as literal matches.

    raises error.ParseError if a 're:' pattern fails to compile.

    helper for tests:
    >>> def test(pattern, *tests):
    ...     kind, pattern, matcher = stringmatcher(pattern)
    ...     return (kind, pattern, [bool(matcher(t)) for t in tests])
    >>> def itest(pattern, *tests):
    ...     kind, pattern, matcher = stringmatcher(pattern, casesensitive=False)
    ...     return (kind, pattern, [bool(matcher(t)) for t in tests])

    exact matching (no prefix):
    >>> test(b'abcdefg', b'abc', b'def', b'abcdefg')
    ('literal', 'abcdefg', [False, False, True])

    regex matching ('re:' prefix)
    >>> test(b're:a.+b', b'nomatch', b'fooadef', b'fooadefbar')
    ('re', 'a.+b', [False, False, True])

    force exact matches ('literal:' prefix)
    >>> test(b'literal:re:foobar', b'foobar', b're:foobar')
    ('literal', 're:foobar', [False, True])

    unknown prefixes are ignored and treated as literals
    >>> test(b'foo:bar', b'foo', b'bar', b'foo:bar')
    ('literal', 'foo:bar', [False, False, True])

    case insensitive regex matches
    >>> itest(b're:A.+b', b'nomatch', b'fooadef', b'fooadefBar')
    ('re', 'A.+b', [False, False, True])

    case insensitive literal matches
    >>> itest(b'ABCDEFG', b'abc', b'def', b'abcdefg')
    ('literal', 'ABCDEFG', [False, False, True])
    """
    if pattern.startswith('re:'):
        pattern = pattern[3:]
        try:
            flags = 0
            if not casesensitive:
                flags = remod.I
            regex = remod.compile(pattern, flags)
        except remod.error as e:
            # format the exception through forcebytestr(): interpolating an
            # exception object directly into a bytes template raises
            # TypeError on Python 3
            raise error.ParseError(_('invalid regular expression: %s')
                                   % forcebytestr(e))
        return 're', pattern, regex.search
    elif pattern.startswith('literal:'):
        pattern = pattern[8:]

    match = pattern.__eq__

    if not casesensitive:
        # compare lower-cased forms; the pattern is lowered only once
        ipat = encoding.lower(pattern)
        match = lambda s: ipat == encoding.lower(s)
    return 'literal', pattern, match

181

182

def shortuser(user):
    """Return a short representation of a user name or email address.

    The input is narrowed in four successive steps, each applied only when
    its delimiter is present: drop everything from the first '@', drop
    everything up to and including the first '<', drop everything from the
    first ' ', then drop everything from the first '.'.
    """
    f = user.find('@')
    if f >= 0:
        user = user[:f]
    f = user.find('<')
    if f >= 0:
        user = user[f + 1:]
    f = user.find(' ')
    if f >= 0:
        user = user[:f]
    f = user.find('.')
    if f >= 0:
        user = user[:f]
    return user

197

198

def emailuser(user):
    """Return the user portion of an email address.

    Everything from the first '@' onwards is dropped, then everything up to
    and including the first '<'. Input containing neither delimiter is
    returned unchanged.
    """
    f = user.find('@')
    if f >= 0:
        user = user[:f]
    f = user.find('<')
    if f >= 0:
        user = user[f + 1:]
    return user

207

208

def email(author):
    '''get email of author.

    Returns the text between the first '<' and the first '>'. A missing '<'
    makes the result start at the beginning of ``author``; a missing '>'
    makes it run to the end.
    '''
    r = author.find('>')
    if r == -1:
        # no closing bracket: slice through to the end of the string
        r = None
    # find() returns -1 when '<' is absent, so the "+ 1" yields index 0
    return author[author.find('<') + 1:r]

214

215

def person(author):
    """Returns the name before an email address,
    interpreting it as per RFC 5322

    Input without an '@' is returned unchanged. When a '<' is present the
    text before it is used, with surrounding spaces and double quotes
    stripped and backslash-escaped quotes unescaped. Otherwise the text
    before the '@' is used, with dots replaced by spaces.

    >>> person(b'foo@bar')
    'foo'
    >>> person(b'Foo Bar <foo@bar>')
    'Foo Bar'
    >>> person(b'"Foo Bar" <foo@bar>')
    'Foo Bar'
    >>> person(b'"Foo \"buz\" Bar" <foo@bar>')
    'Foo "buz" Bar'
    >>> # The following are invalid, but do exist in real-life
    ...
    >>> person(b'Foo "buz" Bar <foo@bar>')
    'Foo "buz" Bar'
    >>> person(b'"Foo Bar <foo@bar>')
    'Foo Bar'
    """
    if '@' not in author:
        return author
    f = author.find('<')
    if f != -1:
        return author[:f].strip(' "').replace('\\"', '"')
    f = author.find('@')
    return author[:f].replace('.', ' ')

241

242

@attr.s(hash=True)
class mailmapping(object):
    '''Represents a username/email key or value in
    a mailmap file'''
    # email address, stored without the surrounding "<>"
    email = attr.ib()
    # name associated with the address; None when the entry has no name
    name = attr.ib(default=None)

248

249

def _ismailmaplineinvalid(names, emails):

249

def _ismailmaplineinvalid(names, emails):

250

'''Returns True if the parsed names and emails

250

'''Returns True if the parsed names and emails

251

in a mailmap entry are invalid.

251

in a mailmap entry are invalid.

252

253

>>> # No names or emails fails

253

>>> # No names or emails fails

254

>>> names, emails = [], []

254

>>> names, emails = [], []

255

>>> _ismailmaplineinvalid(names, emails)

255

>>> _ismailmaplineinvalid(names, emails)

256

True

256

True

257

>>> # Only one email fails

257

>>> # Only one email fails

258

>>> emails = [b'email@email.com']

258

>>> emails = [b'email@email.com']

259

>>> _ismailmaplineinvalid(names, emails)

259

>>> _ismailmaplineinvalid(names, emails)

260

True

260

True

261

>>> # One email and one name passes

261

>>> # One email and one name passes

262

>>> names = [b'Test Name']

262

>>> names = [b'Test Name']

263

>>> _ismailmaplineinvalid(names, emails)

263

>>> _ismailmaplineinvalid(names, emails)

264

False

264

False

265

>>> # No names but two emails passes

265

>>> # No names but two emails passes

266

>>> names = []

266

>>> names = []

267

>>> emails = [b'proper@email.com', b'commit@email.com']

267

>>> emails = [b'proper@email.com', b'commit@email.com']

268

>>> _ismailmaplineinvalid(names, emails)

268

>>> _ismailmaplineinvalid(names, emails)

269

False

269

False

270

'''

270

'''

271

return not emails or not names and len(emails) < 2

271

return not emails or not names and len(emails) < 2

272

273

def parsemailmap(mailmapcontent):
    """Parses data in the .mailmap format

    Returns a dict mapping a ``mailmapping`` key (the commit email, plus the
    commit name when the line carries two names) to the ``mailmapping``
    holding the proper email and name. ``None`` content yields an empty
    dict. Comment lines and lines that fail _ismailmaplineinvalid() are
    skipped.

    >>> mmdata = b"\\n".join([
    ...     b'# Comment',
    ...     b'Name <commit1@email.xx>',
    ...     b'<name@email.xx> <commit2@email.xx>',
    ...     b'Name <proper@email.xx> <commit3@email.xx>',
    ...     b'Name <proper@email.xx> Commit <commit4@email.xx>',
    ... ])
    >>> mm = parsemailmap(mmdata)
    >>> for key in sorted(mm.keys()):
    ...     print(key)
    mailmapping(email='commit1@email.xx', name=None)
    mailmapping(email='commit2@email.xx', name=None)
    mailmapping(email='commit3@email.xx', name=None)
    mailmapping(email='commit4@email.xx', name='Commit')
    >>> for val in sorted(mm.values()):
    ...     print(val)
    mailmapping(email='commit1@email.xx', name='Name')
    mailmapping(email='name@email.xx', name=None)
    mailmapping(email='proper@email.xx', name='Name')
    mailmapping(email='proper@email.xx', name='Name')
    """
    mailmap = {}

    if mailmapcontent is None:
        return mailmap

    for line in mailmapcontent.splitlines():

        # Don't bother checking the line if it is a comment or
        # is an improperly formed author field
        if line.lstrip().startswith('#'):
            continue

        # names, emails hold the parsed emails and names for each line
        # namebuilder holds the words in a person's name
        names, emails = [], []
        namebuilder = []

        for element in line.split():
            if element.startswith('#'):
                # If we reach a comment in the mailmap file, move on
                break

            elif element.startswith('<') and element.endswith('>'):
                # We have found an email.
                # Parse it, and finalize any names from earlier
                emails.append(element[1:-1])  # Slice off the "<>"

                if namebuilder:
                    names.append(' '.join(namebuilder))
                    namebuilder = []

                # Break if we have found a second email, any other
                # data does not fit the spec for .mailmap
                if len(emails) > 1:
                    break

            else:
                # We have found another word in the committers name
                namebuilder.append(element)

        # Check to see if we have parsed the line into a valid form
        # We require at least one email, and either at least one
        # name or a second email
        if _ismailmaplineinvalid(names, emails):
            continue

        # key: the last email on the line; the name is part of the key only
        # when the line supplied two names
        mailmapkey = mailmapping(
            email=emails[-1],
            name=names[-1] if len(names) == 2 else None,
        )

        # value: the first email and, if present, the first name
        mailmap[mailmapkey] = mailmapping(
            email=emails[0],
            name=names[0] if names else None,
        )

    return mailmap

354

355

def mapname(mailmap, author):
    """Returns the author field according to the mailmap cache, or
    the original author field.

    ``mailmap`` is a dict keyed and valued by ``mailmapping`` objects, as
    built by parsemailmap(). The lookup first uses both name and email of
    ``author`` and then falls back to the email alone; name and email are
    replaced independently, each only when the matched entry provides one.

    >>> mmdata = b"\\n".join([
    ...     b'# Comment',
    ...     b'Name <commit1@email.xx>',
    ...     b'<name@email.xx> <commit2@email.xx>',
    ...     b'Name <proper@email.xx> <commit3@email.xx>',
    ...     b'Name <proper@email.xx> Commit <commit4@email.xx>',
    ... ])
    >>> m = parsemailmap(mmdata)
    >>> mapname(m, b'Commit <commit1@email.xx>')
    'Name <commit1@email.xx>'
    >>> mapname(m, b'Name <commit2@email.xx>')
    'Name <name@email.xx>'
    >>> mapname(m, b'Commit <commit3@email.xx>')
    'Name <proper@email.xx>'
    >>> mapname(m, b'Commit <commit4@email.xx>')
    'Name <proper@email.xx>'
    >>> mapname(m, b'Unknown Name <unknown@email.com>')
    'Unknown Name <unknown@email.com>'
    """
    # If the author field coming in isn't in the correct format,
    # or the mailmap is empty just return the original author field
    if not isauthorwellformed(author) or not mailmap:
        return author

    # Turn the user name into a mailmapping
    commit = mailmapping(name=person(author), email=email(author))

    try:
        # Try and use both the commit email and name as the key
        proper = mailmap[commit]

    except KeyError:
        # If the lookup fails, use just the email as the key instead
        # We call this commit2 as not to erase original commit fields
        commit2 = mailmapping(email=commit.email)
        proper = mailmap.get(commit2, mailmapping(None, None))

    # Return the author field with proper values filled in
    return '%s <%s>' % (
        proper.name if proper.name else commit.name,
        proper.email if proper.email else commit.email,
    )

401

402

# one or more non-'<' characters, a whitespace character, then
# '<local@domain>' with no further angle brackets inside
_correctauthorformat = remod.compile(br'^[^<]+\s\<[^<>]+@[^<>]+\>$')

def isauthorwellformed(author):
    '''Return True if the author field is well formed
    (ie "Contributor Name <contrib@email.dom>")

    The check is a match of ``author`` against ``_correctauthorformat``.

    >>> isauthorwellformed(b'Good Author <good@author.com>')
    True
    >>> isauthorwellformed(b'Author <good@author.com>')
    True
    >>> isauthorwellformed(b'Bad Author')
    False
    >>> isauthorwellformed(b'Bad Author <author@author.com')
    False
    >>> isauthorwellformed(b'Bad Author author@author.com')
    False
    >>> isauthorwellformed(b'<author@author.com>')
    False
    >>> isauthorwellformed(b'Bad Author <author>')
    False
    '''
    return _correctauthorformat.match(author) is not None

424

425

def ellipsis(text, maxlength=400):
    """Trim string to at most maxlength (default: 400) columns in display.

    Delegates to encoding.trim(), passing '...' as the ellipsis marker.
    """
    return encoding.trim(text, maxlength, ellipsis='...')

428

429

def escapestr(s):
    """Return ``s`` with special characters backslash-escaped.

    ``s`` is handed to codecs.escape_encode() and the first item of the
    result (the escaped data) is returned.
    """
    # call underlying function of s.encode('string_escape') directly for
    # Python 3 compatibility
    return codecs.escape_encode(s)[0]

433

434

def unescapestr(s):
    """Return ``s`` with backslash escape sequences decoded.

    ``s`` is handed to codecs.escape_decode() and the first item of the
    result (the decoded data) is returned.
    """
    return codecs.escape_decode(s)[0]

436

437

def forcebytestr(obj):
    """Portably format an arbitrary object (e.g. exception) into a byte
    string.

    pycompat.bytestr() is tried first; if it raises UnicodeEncodeError the
    object is converted with str() and encoding.strtolocal() instead.
    """
    try:
        return pycompat.bytestr(obj)
    except UnicodeEncodeError:
        # non-ascii string, may be lossy
        return pycompat.bytestr(encoding.strtolocal(str(obj)))

445

446

def uirepr(s):
    """Return the byterepr() of ``s`` with doubled backslashes collapsed.

    ``s`` is converted with pycompat.bytestr() before being formatted.
    """
    # Avoid double backslash in Windows path repr()
    return pycompat.byterepr(pycompat.bytestr(s)).replace(b'\\\\', b'\\')

449

450

# delay import of textwrap

450

# delay import of textwrap

451

def _MBTextWrapper(**kwargs):

451

def _MBTextWrapper(**kwargs):

452

class tw(textwrap.TextWrapper):

452

class tw(textwrap.TextWrapper):

453

"""

453

"""

454

Extend TextWrapper for width-awareness.

454

Extend TextWrapper for width-awareness.

455

456

Neither number of 'bytes' in any encoding nor 'characters' is

456

Neither number of 'bytes' in any encoding nor 'characters' is

457

appropriate to calculate terminal columns for specified string.

457

appropriate to calculate terminal columns for specified string.

458

459

Original TextWrapper implementation uses built-in 'len()' directly,

459

Original TextWrapper implementation uses built-in 'len()' directly,

460

so overriding is needed to use width information of each characters.

460

so overriding is needed to use width information of each characters.

461

462

In addition, characters classified into 'ambiguous' width are

462

In addition, characters classified into 'ambiguous' width are

463

treated as wide in East Asian area, but as narrow in other.

463

treated as wide in East Asian area, but as narrow in other.

464

465

This requires use decision to determine width of such characters.

465

This requires use decision to determine width of such characters.

466

"""

466

"""

467

def _cutdown(self, ucstr, space_left):

467

def _cutdown(self, ucstr, space_left):

468

l = 0

468

l = 0

469

colwidth = encoding.ucolwidth

469

colwidth = encoding.ucolwidth

470

for i in pycompat.xrange(len(ucstr)):

470

for i in pycompat.xrange(len(ucstr)):

471

l += colwidth(ucstr[i])

471

l += colwidth(ucstr[i])

472

if space_left < l:

472

if space_left < l:

473

return (ucstr[:i], ucstr[i:])

473

return (ucstr[:i], ucstr[i:])

474

return ucstr, ''

474

return ucstr, ''

475

476

# overriding of base class

476

# overriding of base class

477

def _handle_long_word(self, reversed_chunks, cur_line, cur_len, width):

477

def _handle_long_word(self, reversed_chunks, cur_line, cur_len, width):

478

space_left = max(width - cur_len, 1)

478

space_left = max(width - cur_len, 1)

479

480

if self.break_long_words:

480

if self.break_long_words:

481

cut, res = self._cutdown(reversed_chunks[-1], space_left)

481

cut, res = self._cutdown(reversed_chunks[-1], space_left)

482

cur_line.append(cut)

482

cur_line.append(cut)

483

reversed_chunks[-1] = res

483

reversed_chunks[-1] = res

484

elif not cur_line:

484

elif not cur_line:

485

cur_line.append(reversed_chunks.pop())

485

cur_line.append(reversed_chunks.pop())

486

487

# this overriding code is imported from TextWrapper of Python 2.6

487

# this overriding code is imported from TextWrapper of Python 2.6

488

# to calculate columns of string by 'encoding.ucolwidth()'

488

# to calculate columns of string by 'encoding.ucolwidth()'

489

def _wrap_chunks(self, chunks):

489

def _wrap_chunks(self, chunks):

490

colwidth = encoding.ucolwidth

490

colwidth = encoding.ucolwidth

491

492

lines = []

492

lines = []

493

if self.width <= 0:

493

if self.width <= 0:

494

raise ValueError("invalid width %r (must be > 0)" % self.width)

494

raise ValueError("invalid width %r (must be > 0)" % self.width)

495

496

# Arrange in reverse order so items can be efficiently popped

496

# Arrange in reverse order so items can be efficiently popped

497

# from a stack of chucks.

497

# from a stack of chucks.

498

chunks.reverse()

498

chunks.reverse()

499

500

while chunks:

500

while chunks:

501

502

# Start the list of chunks that will make up the current line.

502

# Start the list of chunks that will make up the current line.

503

# cur_len is just the length of all the chunks in cur_line.

503

# cur_len is just the length of all the chunks in cur_line.

504

cur_line = []

504

cur_line = []

505

cur_len = 0

505

cur_len = 0

506

507

# Figure out which static string will prefix this line.

507

# Figure out which static string will prefix this line.

508

if lines:

508

if lines:

509

indent = self.subsequent_indent

509

indent = self.subsequent_indent

510

else:

510

else:

511

indent = self.initial_indent

511

indent = self.initial_indent

512

513

# Maximum width for this line.

513

# Maximum width for this line.

514

width = self.width - len(indent)

514

width = self.width - len(indent)

515

516

# First chunk on line is whitespace -- drop it, unless this

516

# First chunk on line is whitespace -- drop it, unless this

517

# is the very beginning of the text (i.e. no lines started yet).

517

# is the very beginning of the text (i.e. no lines started yet).

518

if self.drop_whitespace and chunks[-1].strip() == r'' and lines:

518

if self.drop_whitespace and chunks[-1].strip() == r'' and lines:

519

del chunks[-1]

519

del chunks[-1]

520

521

while chunks:

521

while chunks:

522

l = colwidth(chunks[-1])

522

l = colwidth(chunks[-1])

523

524

# Can at least squeeze this chunk onto the current line.

524

# Can at least squeeze this chunk onto the current line.

525

if cur_len + l <= width:

525

if cur_len + l <= width:

526

cur_line.append(chunks.pop())

526

cur_line.append(chunks.pop())

527

cur_len += l

527

cur_len += l

528

529

# Nope, this line is full.

529

# Nope, this line is full.

530

else:

530

else:

531

break

531

break

532

533

# The current line is full, and the next chunk is too big to

533

# The current line is full, and the next chunk is too big to

534

# fit on *any* line (not just this one).

534

# fit on *any* line (not just this one).

535

if chunks and colwidth(chunks[-1]) > width:

535

if chunks and colwidth(chunks[-1]) > width:

536

self._handle_long_word(chunks, cur_line, cur_len, width)

536

self._handle_long_word(chunks, cur_line, cur_len, width)

537

538

# If the last chunk on this line is all whitespace, drop it.

538

# If the last chunk on this line is all whitespace, drop it.

539

if (self.drop_whitespace and

539

if (self.drop_whitespace and

540

cur_line and cur_line[-1].strip() == r''):

540

cur_line and cur_line[-1].strip() == r''):

541

del cur_line[-1]

541

del cur_line[-1]

542

543

# Convert current line back to a string and store it in list

543

# Convert current line back to a string and store it in list

544

# of all lines (return value).

544

# of all lines (return value).

545

if cur_line:

545

if cur_line:

546

lines.append(indent + r''.join(cur_line))

546

lines.append(indent + r''.join(cur_line))

547

548

return lines

548

return lines

549

550

global _MBTextWrapper

550

global _MBTextWrapper

551

_MBTextWrapper = tw

551

_MBTextWrapper = tw

552

return tw(**kwargs)

552

return tw(**kwargs)

553

554

def wrap(line, width, initindent='', hangindent=''):
    """Wrap ``line`` to ``width`` columns and return the encoded result.

    ``line``, ``initindent`` and ``hangindent`` are decoded with
    ``encoding.encoding`` / ``encoding.encodingmode``, wrapped with
    ``_MBTextWrapper`` (``initindent`` prefixes the first line,
    ``hangindent`` every following line) and the filled text is encoded
    back with ``encoding.encoding``.
    """
    maxindent = max(len(hangindent), len(initindent))
    if width <= maxindent:
        # adjust for weird terminal size
        width = max(78, maxindent + 1)
    line = line.decode(pycompat.sysstr(encoding.encoding),
                       pycompat.sysstr(encoding.encodingmode))
    initindent = initindent.decode(pycompat.sysstr(encoding.encoding),
                                   pycompat.sysstr(encoding.encodingmode))
    hangindent = hangindent.decode(pycompat.sysstr(encoding.encoding),
                                   pycompat.sysstr(encoding.encodingmode))
    wrapper = _MBTextWrapper(width=width,
                             initial_indent=initindent,
                             subsequent_indent=hangindent)
    return wrapper.fill(line).encode(pycompat.sysstr(encoding.encoding))

569

570

# Accepted spellings of boolean values, keyed by their lower-case form.
_booleans = {'1': True, 'yes': True, 'true': True, 'on': True, 'always': True,
             '0': False, 'no': False, 'false': False, 'off': False,
             'never': False}

def parsebool(s):
    """Parse s into a boolean.

    The lookup is case-insensitive.  If s is not a valid boolean, returns
    None.
    """
    return _booleans.get(s.lower(), None)

580

581

def evalpythonliteral(s):
    """Evaluate a string containing a Python literal expression"""
    # We could backport our tokenizer hack to rewrite '' to u'' if we want
    if pycompat.ispy3:
        # ast.literal_eval() is handed text on Python 3, so decode first.
        return ast.literal_eval(s.decode('latin1'))
    return ast.literal_eval(s)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # stringutil.py - utility for generic string formatting, parsing, etc.
             #
             #  Copyright 2005 K. Thananchayan <thananck@yahoo.com>
             #  Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
             #  Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import
             import ast
             import codecs
             import re as remod
             import textwrap
             from ..i18n import _
             from ..thirdparty import attr
             from .. import (
                 encoding,
                 error,
                 pycompat,
             )
             # Characters with special meaning in a regular expression, taken from
             # https://bugs.python.org/issue29995, which was part of Python 3.7.
             _respecial = pycompat.bytestr(b'()[]{}?*+-|^$\\.&~# \t\n\r\v\f')
             # Translation table: code point -> backslash-escaped replacement text.
             _regexescapemap = {
                 ord(ch): (b'\\' + ch).decode('latin1') for ch in _respecial
             }

             def reescape(pat):
                 """Drop-in replacement for re.escape.

                 ``pat`` may be bytes or unicode; the result has the same type as
                 the input.
                 """
                 # NOTE: the escaping is intentionally done on unicode, because it
                 # is only possible with unicode.translate, not bytes.translate.
                 # Bytes input therefore takes a round trip through latin1.
                 if not isinstance(pat, bytes):
                     return pat.translate(_regexescapemap)
                 escaped = pat.decode('latin1').translate(_regexescapemap)
                 return escaped.encode('latin1')
             def pprint(o, bprefix=False):
                 """Pretty print an object.

                 bytes, bytearray, list, dict, set and tuple values are formatted
                 here (containers recursively, dict items and set members in sorted
                 order); any other object is passed to ``pycompat.byterepr``.  When
                 ``bprefix`` is true, bytes values are rendered with a leading ``b``.
                 """
                 def render(item):
                     # Recurse with the caller's bprefix setting.
                     return pprint(item, bprefix=bprefix)

                 if isinstance(o, bytes):
                     template = "b'%s'" if bprefix else "'%s'"
                     return template % escapestr(o)
                 if isinstance(o, bytearray):
                     # codecs.escape_encode() can't handle bytearray, so escapestr
                     # fails without coercion.
                     return "bytearray['%s']" % escapestr(bytes(o))
                 if isinstance(o, list):
                     return '[%s]' % (b', '.join(render(a) for a in o))
                 if isinstance(o, dict):
                     pairs = ('%s: %s' % (render(k), render(v))
                              for k, v in sorted(o.items()))
                     return '{%s}' % (b', '.join(pairs))
                 if isinstance(o, set):
                     return 'set([%s])' % (b', '.join(render(k) for k in sorted(o)))
                 if isinstance(o, tuple):
                     return '(%s)' % (b', '.join(render(a) for a in o))
                 return pycompat.byterepr(o)
             def prettyrepr(o):
                 """Pretty print a representation of a possibly-nested object

                 The ``pycompat.byterepr`` of ``o`` is split in front of each '<'
                 (or in front of the ' field=' that introduces it), and every piece
                 is put on its own line, indented by two spaces per unclosed '<'
                 that precedes it.
                 """
                 # (nesting level, text) pairs, one per output line
                 lines = []
                 rs = pycompat.byterepr(o)
                 # p0: start of the piece being emitted; p1: position of the '<'
                 # that belongs to it (both start at 0)
                 p0 = p1 = 0
                 while p0 < len(rs):
                     # '... field=<type ... field=<type ...'
                     #      ~~~~~~~~~~~~~~~~
                     #      p0    p1        q0    q1
                     q0 = -1
                     # q1: the next '<' after the current one
                     q1 = rs.find('<', p1 + 1)
                     if q1 < 0:
                         # no more '<': the current piece runs to the end
                         q1 = len(rs)
                     elif q1 > p1 + 1 and rs.startswith('=', q1 - 1):
                         # backtrack for ' field=<'
                         q0 = rs.rfind(' ', p1 + 1, q1 - 1)
                     if q0 < 0:
                         # no ' field=' prefix found: cut right at the '<'
                         q0 = q1
                     else:
                         q0 += 1  # skip ' '
                     # nesting level = '<' minus '>' seen before this piece
                     l = rs.count('<', 0, p0) - rs.count('>', 0, p0)
                     assert l >= 0
                     lines.append((l, rs[p0:q0].rstrip()))
                     p0, p1 = q0, q1
                 return '\n'.join('  ' * l + s for l, s in lines)
             def buildrepr(r):
                 """Format an optional printable representation from unexpanded bits

                 ========  =================================
                 type(r)   example
                 ========  =================================
                 tuple     ('<not %r>', other)
                 bytes     '<branch closed>'
                 callable  lambda: '<branch %r>' % sorted(b)
                 object    other
                 ========  =================================

                 ``None`` yields an empty string.  A tuple is treated as a format
                 string followed by its arguments, bytes are returned unchanged, a
                 callable is called and its result returned, and any other object
                 is formatted with ``pprint``.
                 """
                 if r is None:
                     return ''
                 elif isinstance(r, tuple):
                     # r[0] is the format; the remaining items are its arguments
                     return r[0] % pycompat.rapply(pycompat.maybebytestr, r[1:])
                 elif isinstance(r, bytes):
                     return r
                 elif callable(r):
                     return r()
                 else:
                     return pprint(r)
             def binary(s):
                 """return true if a string is binary data

                 A string counts as binary when it is non-empty and contains a NUL
                 character.
                 """
                 if not s:
                     return False
                 return '\0' in s
             def stringmatcher(pattern, casesensitive=True):
                 """
                 accepts a string, possibly starting with 're:' or 'literal:' prefix.
                 returns the matcher name, pattern, and matcher function.
                 missing or unknown prefixes are treated as literal matches.

                 helper for tests:
                 >>> def test(pattern, *tests):
                 ...     kind, pattern, matcher = stringmatcher(pattern)
                 ...     return (kind, pattern, [bool(matcher(t)) for t in tests])
                 >>> def itest(pattern, *tests):
                 ...     kind, pattern, matcher = stringmatcher(pattern, casesensitive=False)
                 ...     return (kind, pattern, [bool(matcher(t)) for t in tests])

                 exact matching (no prefix):
                 >>> test(b'abcdefg', b'abc', b'def', b'abcdefg')
                 ('literal', 'abcdefg', [False, False, True])

                 regex matching ('re:' prefix)
                 >>> test(b're:a.+b', b'nomatch', b'fooadef', b'fooadefbar')
                 ('re', 'a.+b', [False, False, True])

                 force exact matches ('literal:' prefix)
                 >>> test(b'literal:re:foobar', b'foobar', b're:foobar')
                 ('literal', 're:foobar', [False, True])

                 unknown prefixes are ignored and treated as literals
                 >>> test(b'foo:bar', b'foo', b'bar', b'foo:bar')
                 ('literal', 'foo:bar', [False, False, True])

                 case insensitive regex matches
                 >>> itest(b're:A.+b', b'nomatch', b'fooadef', b'fooadefBar')
                 ('re', 'A.+b', [False, False, True])

                 case insensitive literal matches
                 >>> itest(b'ABCDEFG', b'abc', b'def', b'abcdefg')
                 ('literal', 'ABCDEFG', [False, False, True])
                 """
                 if pattern.startswith('re:'):
                     regexsrc = pattern[3:]
                     flags = 0 if casesensitive else remod.I
                     try:
                         compiled = remod.compile(regexsrc, flags)
                     except remod.error as e:
                         raise error.ParseError(_('invalid regular expression: %s')
                                                % e)
                     # the matcher is an unanchored search
                     return 're', regexsrc, compiled.search

                 if pattern.startswith('literal:'):
                     pattern = pattern[8:]

                 if casesensitive:
                     return 'literal', pattern, pattern.__eq__

                 # fold the pattern once; each candidate is folded when matched
                 folded = encoding.lower(pattern)
                 return 'literal', pattern, lambda s: folded == encoding.lower(s)
             def shortuser(user):
                 """Return a short representation of a user name or email address.

                 Everything from the first '@' on is dropped, then everything up to
                 and including the first '<', then everything from the first space
                 on, and finally everything from the first '.' on.
                 """
                 pos = user.find('@')
                 if pos >= 0:
                     user = user[:pos]
                 pos = user.find('<')
                 if pos >= 0:
                     user = user[pos + 1:]
                 # the last two cuts both keep the text before the separator
                 for sep in (' ', '.'):
                     pos = user.find(sep)
                     if pos >= 0:
                         user = user[:pos]
                 return user
             def emailuser(user):
                 """Return the user portion of an email address.

                 The text from the first '@' on is dropped, then anything up to and
                 including the first '<' in what remains.
                 """
                 at = user.find('@')
                 local = user[:at] if at >= 0 else user
                 lt = local.find('<')
                 return local[lt + 1:] if lt >= 0 else local
             def email(author):
                 '''get email of author.

                 Returns the text after the first '<' (or from the start when there
                 is none) up to the first '>' (or to the end when there is none).
                 '''
                 start = author.find('<') + 1
                 end = author.find('>')
                 if end == -1:
                     return author[start:]
                 return author[start:end]
             def person(author):
                 """Returns the name before an email address,
                 interpreting it as per RFC 5322

                 >>> person(b'foo@bar')
                 'foo'
                 >>> person(b'Foo Bar <foo@bar>')
                 'Foo Bar'
                 >>> person(b'"Foo Bar" <foo@bar>')
                 'Foo Bar'
                 >>> person(b'"Foo \"buz\" Bar" <foo@bar>')
                 'Foo "buz" Bar'
                 >>> # The following are invalid, but do exist in real-life
                 ...
                 >>> person(b'Foo "buz" Bar <foo@bar>')
                 'Foo "buz" Bar'
                 >>> person(b'"Foo Bar <foo@bar>')
                 'Foo Bar'
                 """
                 if '@' not in author:
                     # no address at all: the whole field is the name
                     return author
                 lt = author.find('<')
                 if lt == -1:
                     # bare address: use the local part, with dots shown as spaces
                     return author[:author.find('@')].replace('.', ' ')
                 # 'Name <addr>': strip surrounding blanks/quotes, unescape \"
                 return author[:lt].strip(' "').replace('\\"', '"')
             # hash=True asks attrs for a __hash__, so instances can serve as dict keys
             # (parsemailmap() in this file uses them that way).
             @attr.s(hash=True)
             class mailmapping(object):
                 '''Represents a username/email key or value in
                 a mailmap file'''
                 # email address; has no default, so it must be supplied
                 email = attr.ib()
                 # name that goes with the address; None when absent
                 name = attr.ib(default=None)
             def _ismailmaplineinvalid(names, emails):
                 '''Returns True if the parsed names and emails
                 in a mailmap entry are invalid.
                 >>> # No names or emails fails
                 >>> names, emails = [], []
                 >>> _ismailmaplineinvalid(names, emails)
                 True
                 >>> # Only one email fails
                 >>> emails = [b'email@email.com']
                 >>> _ismailmaplineinvalid(names, emails)
                 True
                 >>> # One email and one name passes
                 >>> names = [b'Test Name']
                 >>> _ismailmaplineinvalid(names, emails)
                 False
                 >>> # No names but two emails passes
                 >>> names = []
                 >>> emails = [b'proper@email.com', b'commit@email.com']
                 >>> _ismailmaplineinvalid(names, emails)
                 False
                 '''
                 return not emails or not names and len(emails) < 2
             def parsemailmap(mailmapcontent):
                 """Parses data in the .mailmap format

                 Returns a dict that maps a ``mailmapping`` built from the commit
                 email (and commit name, when the line carries two names) to a
                 ``mailmapping`` holding the proper email and name.  ``None`` input
                 yields an empty dict.

                 >>> mmdata = b"\\n".join([
                 ... b'# Comment',
                 ... b'Name <commit1@email.xx>',
                 ... b'<name@email.xx> <commit2@email.xx>',
                 ... b'Name <proper@email.xx> <commit3@email.xx>',
                 ... b'Name <proper@email.xx> Commit <commit4@email.xx>',
                 ... ])
                 >>> mm = parsemailmap(mmdata)
                 >>> for key in sorted(mm.keys()):
                 ...     print(key)
                 mailmapping(email='commit1@email.xx', name=None)
                 mailmapping(email='commit2@email.xx', name=None)
                 mailmapping(email='commit3@email.xx', name=None)
                 mailmapping(email='commit4@email.xx', name='Commit')
                 >>> for val in sorted(mm.values()):
                 ...     print(val)
                 mailmapping(email='commit1@email.xx', name='Name')
                 mailmapping(email='name@email.xx', name=None)
                 mailmapping(email='proper@email.xx', name='Name')
                 mailmapping(email='proper@email.xx', name='Name')
                 """
                 mailmap = {}
                 if mailmapcontent is None:
                     return mailmap

                 for line in mailmapcontent.splitlines():
                     # Whole-line comments carry no mapping
                     if line.lstrip().startswith('#'):
                         continue

                     # Completed names and emails found on this line, plus the
                     # words of the name currently being collected
                     names = []
                     emails = []
                     pendingwords = []
                     for token in line.split():
                         if token.startswith('#'):
                             # A trailing comment ends the entry
                             break
                         if not (token.startswith('<') and token.endswith('>')):
                             # Another word of the committer's name
                             pendingwords.append(token)
                             continue
                         # An email: slice off the "<>" and finalize any name
                         # collected in front of it
                         emails.append(token[1:-1])
                         if pendingwords:
                             names.append(' '.join(pendingwords))
                             pendingwords = []
                         # Anything after a second email does not fit the
                         # .mailmap spec
                         if len(emails) > 1:
                             break

                     # At least one email is required, and either at least one
                     # name or a second email
                     if _ismailmaplineinvalid(names, emails):
                         continue

                     # Key: the commit side (last email; last name only when the
                     # line has two names)
                     commitname = names[-1] if len(names) == 2 else None
                     key = mailmapping(email=emails[-1], name=commitname)
                     # Value: the proper side (first email, first name if any)
                     propername = names[0] if names else None
                     mailmap[key] = mailmapping(email=emails[0], name=propername)
                 return mailmap
             def mapname(mailmap, author):
                 """Returns the author field according to the mailmap cache, or
                 the original author field.

                 >>> mmdata = b"\\n".join([
                 ...     b'# Comment',
                 ...     b'Name <commit1@email.xx>',
                 ...     b'<name@email.xx> <commit2@email.xx>',
                 ...     b'Name <proper@email.xx> <commit3@email.xx>',
                 ...     b'Name <proper@email.xx> Commit <commit4@email.xx>',
                 ... ])
                 >>> m = parsemailmap(mmdata)
                 >>> mapname(m, b'Commit <commit1@email.xx>')
                 'Name <commit1@email.xx>'
                 >>> mapname(m, b'Name <commit2@email.xx>')
                 'Name <name@email.xx>'
                 >>> mapname(m, b'Commit <commit3@email.xx>')
                 'Name <proper@email.xx>'
                 >>> mapname(m, b'Commit <commit4@email.xx>')
                 'Name <proper@email.xx>'
                 >>> mapname(m, b'Unknown Name <unknown@email.com>')
                 'Unknown Name <unknown@email.com>'
                 """
                 # A malformed author field or an empty mailmap leaves the author
                 # untouched
                 if not (isauthorwellformed(author) and mailmap):
                     return author

                 # Turn the user name into a mailmapping
                 commit = mailmapping(name=person(author), email=email(author))

                 try:
                     # First try the (name, email) pair as the key
                     proper = mailmap[commit]
                 except KeyError:
                     # Fall back to an email-only key; a separate object is used so
                     # the original commit fields stay available below
                     emailonly = mailmapping(email=commit.email)
                     proper = mailmap.get(emailonly, mailmapping(None, None))

                 # Fields missing from the mapping keep their committed values
                 name = proper.name or commit.name
                 address = proper.email or commit.email
                 return '%s <%s>' % (name, address)
             # "Name <local@domain>": a name without '<', one whitespace character,
             # then an address in angle brackets that contains an '@'.
             _correctauthorformat = remod.compile(br'^[^<]+\s\<[^<>]+@[^<>]+\>$')

             def isauthorwellformed(author):
                 '''Return True if the author field is well formed
                 (ie "Contributor Name <contrib@email.dom>")

                 >>> isauthorwellformed(b'Good Author <good@author.com>')
                 True
                 >>> isauthorwellformed(b'Author <good@author.com>')
                 True
                 >>> isauthorwellformed(b'Bad Author')
                 False
                 >>> isauthorwellformed(b'Bad Author <author@author.com')
                 False
                 >>> isauthorwellformed(b'Bad Author author@author.com')
                 False
                 >>> isauthorwellformed(b'<author@author.com>')
                 False
                 >>> isauthorwellformed(b'Bad Author <author>')
                 False
                 '''
                 found = _correctauthorformat.match(author)
                 return found is not None
             def ellipsis(text, maxlength=400):
                 """Trim string to at most maxlength (default: 400) columns in display.

                 The trimming is delegated to ``encoding.trim`` with '...' as the
                 ellipsis marker.
                 """
                 trimmed = encoding.trim(text, maxlength, ellipsis='...')
                 return trimmed
             def escapestr(s):
                 """Return ``s`` with backslash escapes applied by the codecs module."""
                 # call underlying function of s.encode('string_escape') directly for
                 # Python 3 compatibility; it returns an (escaped, length) pair
                 escaped, _consumed = codecs.escape_encode(s)
                 return escaped
             def unescapestr(s):
                 """Return ``s`` with its backslash escapes decoded by the codecs module."""
                 # escape_decode returns a (decoded, length) pair
                 decoded, _consumed = codecs.escape_decode(s)
                 return decoded
             def forcebytestr(obj):
                 """Portably format an arbitrary object (e.g. exception) into a byte
                 string."""
                 try:
                     return pycompat.bytestr(obj)
                 except UnicodeEncodeError:
                     pass
                 # non-ascii string, may be lossy
                 localized = encoding.strtolocal(str(obj))
                 return pycompat.bytestr(localized)
             def uirepr(s):
                 """Return the byte repr of ``s`` with doubled backslashes collapsed."""
                 quoted = pycompat.byterepr(pycompat.bytestr(s))
                 # Avoid double backslash in Windows path repr()
                 return quoted.replace(b'\\\\', b'\\')
             # delay import of textwrap
             def _MBTextWrapper(**kwargs):
                 """Return a width-aware TextWrapper built from ``kwargs``.

                 The first call defines the ``tw`` subclass below and then rebinds
                 the module-level name ``_MBTextWrapper`` to that class, so later
                 calls instantiate the class directly instead of running this
                 function again.
                 """
                 class tw(textwrap.TextWrapper):
                     """
                     Extend TextWrapper for width-awareness.

                     Neither number of 'bytes' in any encoding nor 'characters' is
                     appropriate to calculate terminal columns for specified string.

                     Original TextWrapper implementation uses built-in 'len()' directly,
                     so overriding is needed to use width information of each characters.

                     In addition, characters classified into 'ambiguous' width are
                     treated as wide in East Asian area, but as narrow in other.

                     This requires user decision to determine width of such characters.
                     """
                     def _cutdown(self, ucstr, space_left):
                         # Split ucstr into (head, tail) in front of the first
                         # character whose accumulated column width exceeds
                         # space_left; tail is '' when the whole string fits.
                         l = 0
                         colwidth = encoding.ucolwidth
                         for i in pycompat.xrange(len(ucstr)):
                             l += colwidth(ucstr[i])
                             if space_left < l:
                                 return (ucstr[:i], ucstr[i:])
                         return ucstr, ''

                     # overriding of base class
                     def _handle_long_word(self, reversed_chunks, cur_line, cur_len, width):
                         # Always leave room for at least one column.
                         space_left = max(width - cur_len, 1)

                         if self.break_long_words:
                             # Put as much of the chunk as fits on this line and
                             # leave the remainder on the stack for the next one.
                             cut, res = self._cutdown(reversed_chunks[-1], space_left)
                             cur_line.append(cut)
                             reversed_chunks[-1] = res
                         elif not cur_line:
                             # Breaking is not allowed and the line is empty: take
                             # the whole chunk, even though it is too wide.
                             cur_line.append(reversed_chunks.pop())

                     # this overriding code is imported from TextWrapper of Python 2.6
                     # to calculate columns of string by 'encoding.ucolwidth()'
                     def _wrap_chunks(self, chunks):
                         colwidth = encoding.ucolwidth

                         lines = []
                         if self.width <= 0:
                             raise ValueError("invalid width %r (must be > 0)" % self.width)

                         # Arrange in reverse order so items can be efficiently popped
                         # from a stack of chunks.
                         chunks.reverse()

                         while chunks:

                             # Start the list of chunks that will make up the current line.
                             # cur_len is just the length of all the chunks in cur_line.
                             cur_line = []
                             cur_len = 0

                             # Figure out which static string will prefix this line.
                             if lines:
                                 indent = self.subsequent_indent
                             else:
                                 indent = self.initial_indent

                             # Maximum width for this line.
                             width = self.width - len(indent)

                             # First chunk on line is whitespace -- drop it, unless this
                             # is the very beginning of the text (i.e. no lines started yet).
                             if self.drop_whitespace and chunks[-1].strip() == r'' and lines:
                                 del chunks[-1]

                             while chunks:
                                 l = colwidth(chunks[-1])

                                 # Can at least squeeze this chunk onto the current line.
                                 if cur_len + l <= width:
                                     cur_line.append(chunks.pop())
                                     cur_len += l

                                 # Nope, this line is full.
                                 else:
                                     break

                             # The current line is full, and the next chunk is too big to
                             # fit on *any* line (not just this one).
                             if chunks and colwidth(chunks[-1]) > width:
                                 self._handle_long_word(chunks, cur_line, cur_len, width)

                             # If the last chunk on this line is all whitespace, drop it.
                             if (self.drop_whitespace and
                                 cur_line and cur_line[-1].strip() == r''):
                                 del cur_line[-1]

                             # Convert current line back to a string and store it in list
                             # of all lines (return value).
                             if cur_line:
                                 lines.append(indent + r''.join(cur_line))

                         return lines

                 # Replace this factory function with the class itself for all
                 # subsequent callers.
                 global _MBTextWrapper
                 _MBTextWrapper = tw
                 return tw(**kwargs)
             def wrap(line, width, initindent='', hangindent=''):
                 """Wrap ``line`` to ``width`` columns and return the encoded result.

                 ``initindent`` prefixes the first output line and ``hangindent``
                 every following one.  All three strings are decoded with
                 ``encoding.encoding`` / ``encoding.encodingmode`` before wrapping,
                 and the filled text is encoded back with ``encoding.encoding``.
                 """
                 widest = max(len(hangindent), len(initindent))
                 if width <= widest:
                     # adjust for weird terminal size
                     width = max(78, widest + 1)

                 codec = pycompat.sysstr(encoding.encoding)
                 errmode = pycompat.sysstr(encoding.encodingmode)
                 line = line.decode(codec, errmode)
                 initindent = initindent.decode(codec, errmode)
                 hangindent = hangindent.decode(codec, errmode)

                 wrapper = _MBTextWrapper(
                     width=width,
                     initial_indent=initindent,
                     subsequent_indent=hangindent,
                 )
                 filled = wrapper.fill(line)
                 return filled.encode(codec)
             # Accepted spellings of boolean values, keyed by their lower-case form.
             _booleans = {
                 '1': True,
                 'yes': True,
                 'true': True,
                 'on': True,
                 'always': True,
                 '0': False,
                 'no': False,
                 'false': False,
                 'off': False,
                 'never': False,
             }

             def parsebool(s):
                 """Parse s into a boolean.

                 The lookup is case-insensitive.  If s is not a valid boolean,
                 returns None.
                 """
                 return _booleans.get(s.lower())
             def evalpythonliteral(s):
                 """Evaluate a string containing a Python literal expression"""
                 # We could backport our tokenizer hack to rewrite '' to u'' if we want
                 # On Python 3 the input is decoded as latin1 before evaluation.
                 source = s.decode('latin1') if pycompat.ispy3 else s
                 return ast.literal_eval(source)