stringutil: refactor core of pprint so it emits chunks...
Gregory Szorc
r39389:0d21b1f1 default
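
The commit keeps pprint() as the string-returning entry point and introduces pprintgen(), a generator that emits the representation as chunks; pprint() now simply joins those chunks. Below is a minimal, hypothetical sketch of that wrapper-over-generator pattern in plain Python (str instead of bytes, only a few types handled); it is not Mercurial's implementation, which is in the diff that follows.

    # Sketch of the pattern applied by this commit: a chunk-emitting generator
    # plus a thin join() wrapper that preserves the old string-returning API.
    # Hypothetical simplified code; the real version works on bytes and uses
    # escapestr()/pycompat helpers.

    def pprintgen(o):
        """Pretty print an object to a generator of atoms (chunks)."""
        if isinstance(o, str):
            yield "'%s'" % o
        elif isinstance(o, list):
            yield '[%s]' % ', '.join(pprint(a) for a in o)
        elif isinstance(o, dict):
            yield '{%s}' % ', '.join(
                '%s: %s' % (pprint(k), pprint(v)) for k, v in sorted(o.items()))
        else:
            yield repr(o)

    def pprint(o):
        """Pretty print an object to a single string (the original API)."""
        return ''.join(pprintgen(o))

    print(pprint({'key': ['a', 'b', 1]}))  # {'key': ['a', 'b', 1]}
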
@@ -1,591 +1,597 @@
1 # stringutil.py - utility for generic string formatting, parsing, etc.
1 # stringutil.py - utility for generic string formatting, parsing, etc.
2 #
2 #
3 # Copyright 2005 K. Thananchayan <thananck@yahoo.com>
3 # Copyright 2005 K. Thananchayan <thananck@yahoo.com>
4 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
5 # Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
5 # Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
6 #
6 #
7 # This software may be used and distributed according to the terms of the
7 # This software may be used and distributed according to the terms of the
8 # GNU General Public License version 2 or any later version.
8 # GNU General Public License version 2 or any later version.
9
9
10 from __future__ import absolute_import
10 from __future__ import absolute_import
11
11
12 import ast
12 import ast
13 import codecs
13 import codecs
14 import re as remod
14 import re as remod
15 import textwrap
15 import textwrap
16 import types
16 import types
17
17
18 from ..i18n import _
18 from ..i18n import _
19 from ..thirdparty import attr
19 from ..thirdparty import attr
20
20
21 from .. import (
21 from .. import (
22 encoding,
22 encoding,
23 error,
23 error,
24 pycompat,
24 pycompat,
25 )
25 )
26
26
27 # regex special chars pulled from https://bugs.python.org/issue29995
27 # regex special chars pulled from https://bugs.python.org/issue29995
28 # which was part of Python 3.7.
28 # which was part of Python 3.7.
29 _respecial = pycompat.bytestr(b'()[]{}?*+-|^$\\.&~# \t\n\r\v\f')
29 _respecial = pycompat.bytestr(b'()[]{}?*+-|^$\\.&~# \t\n\r\v\f')
30 _regexescapemap = {ord(i): (b'\\' + i).decode('latin1') for i in _respecial}
30 _regexescapemap = {ord(i): (b'\\' + i).decode('latin1') for i in _respecial}
31
31
32 def reescape(pat):
32 def reescape(pat):
33 """Drop-in replacement for re.escape."""
33 """Drop-in replacement for re.escape."""
34 # NOTE: it is intentional that this works on unicodes and not
34 # NOTE: it is intentional that this works on unicodes and not
35 # bytes, as it's only possible to do the escaping with
35 # bytes, as it's only possible to do the escaping with
36 # unicode.translate, not bytes.translate. Sigh.
36 # unicode.translate, not bytes.translate. Sigh.
37 wantuni = True
37 wantuni = True
38 if isinstance(pat, bytes):
38 if isinstance(pat, bytes):
39 wantuni = False
39 wantuni = False
40 pat = pat.decode('latin1')
40 pat = pat.decode('latin1')
41 pat = pat.translate(_regexescapemap)
41 pat = pat.translate(_regexescapemap)
42 if wantuni:
42 if wantuni:
43 return pat
43 return pat
44 return pat.encode('latin1')
44 return pat.encode('latin1')
45
45
 def pprint(o, bprefix=False):
     """Pretty print an object."""
+    return b''.join(pprintgen(o, bprefix=bprefix))
+
+def pprintgen(o, bprefix=False):
+    """Pretty print an object to a generator of atoms."""
+
     if isinstance(o, bytes):
         if bprefix:
-            return "b'%s'" % escapestr(o)
-        return "'%s'" % escapestr(o)
+            yield "b'%s'" % escapestr(o)
+        else:
+            yield "'%s'" % escapestr(o)
     elif isinstance(o, bytearray):
         # codecs.escape_encode() can't handle bytearray, so escapestr fails
         # without coercion.
-        return "bytearray['%s']" % escapestr(bytes(o))
+        yield "bytearray['%s']" % escapestr(bytes(o))
     elif isinstance(o, list):
-        return '[%s]' % (b', '.join(pprint(a, bprefix=bprefix) for a in o))
+        yield '[%s]' % (b', '.join(pprint(a, bprefix=bprefix) for a in o))
     elif isinstance(o, dict):
-        return '{%s}' % (b', '.join(
+        yield '{%s}' % (b', '.join(
             '%s: %s' % (pprint(k, bprefix=bprefix),
                         pprint(v, bprefix=bprefix))
             for k, v in sorted(o.items())))
     elif isinstance(o, set):
-        return 'set([%s])' % (b', '.join(
+        yield 'set([%s])' % (b', '.join(
             pprint(k, bprefix=bprefix) for k in sorted(o)))
     elif isinstance(o, tuple):
-        return '(%s)' % (b', '.join(pprint(a, bprefix=bprefix) for a in o))
+        yield '(%s)' % (b', '.join(pprint(a, bprefix=bprefix) for a in o))
     elif isinstance(o, types.GeneratorType):
-        return 'gen[%s]' % (b', '.join(pprint(a, bprefix=bprefix) for a in o))
+        yield 'gen[%s]' % (b', '.join(pprint(a, bprefix=bprefix) for a in o))
     else:
-        return pycompat.byterepr(o)
+        yield pycompat.byterepr(o)
72
78
73 def prettyrepr(o):
79 def prettyrepr(o):
74 """Pretty print a representation of a possibly-nested object"""
80 """Pretty print a representation of a possibly-nested object"""
75 lines = []
81 lines = []
76 rs = pycompat.byterepr(o)
82 rs = pycompat.byterepr(o)
77 p0 = p1 = 0
83 p0 = p1 = 0
78 while p0 < len(rs):
84 while p0 < len(rs):
79 # '... field=<type ... field=<type ...'
85 # '... field=<type ... field=<type ...'
80 # ~~~~~~~~~~~~~~~~
86 # ~~~~~~~~~~~~~~~~
81 # p0 p1 q0 q1
87 # p0 p1 q0 q1
82 q0 = -1
88 q0 = -1
83 q1 = rs.find('<', p1 + 1)
89 q1 = rs.find('<', p1 + 1)
84 if q1 < 0:
90 if q1 < 0:
85 q1 = len(rs)
91 q1 = len(rs)
86 elif q1 > p1 + 1 and rs.startswith('=', q1 - 1):
92 elif q1 > p1 + 1 and rs.startswith('=', q1 - 1):
87 # backtrack for ' field=<'
93 # backtrack for ' field=<'
88 q0 = rs.rfind(' ', p1 + 1, q1 - 1)
94 q0 = rs.rfind(' ', p1 + 1, q1 - 1)
89 if q0 < 0:
95 if q0 < 0:
90 q0 = q1
96 q0 = q1
91 else:
97 else:
92 q0 += 1 # skip ' '
98 q0 += 1 # skip ' '
93 l = rs.count('<', 0, p0) - rs.count('>', 0, p0)
99 l = rs.count('<', 0, p0) - rs.count('>', 0, p0)
94 assert l >= 0
100 assert l >= 0
95 lines.append((l, rs[p0:q0].rstrip()))
101 lines.append((l, rs[p0:q0].rstrip()))
96 p0, p1 = q0, q1
102 p0, p1 = q0, q1
97 return '\n'.join(' ' * l + s for l, s in lines)
103 return '\n'.join(' ' * l + s for l, s in lines)
98
104
99 def buildrepr(r):
105 def buildrepr(r):
100 """Format an optional printable representation from unexpanded bits
106 """Format an optional printable representation from unexpanded bits
101
107
102 ======== =================================
108 ======== =================================
103 type(r) example
109 type(r) example
104 ======== =================================
110 ======== =================================
105 tuple ('<not %r>', other)
111 tuple ('<not %r>', other)
106 bytes '<branch closed>'
112 bytes '<branch closed>'
107 callable lambda: '<branch %r>' % sorted(b)
113 callable lambda: '<branch %r>' % sorted(b)
108 object other
114 object other
109 ======== =================================
115 ======== =================================
110 """
116 """
111 if r is None:
117 if r is None:
112 return ''
118 return ''
113 elif isinstance(r, tuple):
119 elif isinstance(r, tuple):
114 return r[0] % pycompat.rapply(pycompat.maybebytestr, r[1:])
120 return r[0] % pycompat.rapply(pycompat.maybebytestr, r[1:])
115 elif isinstance(r, bytes):
121 elif isinstance(r, bytes):
116 return r
122 return r
117 elif callable(r):
123 elif callable(r):
118 return r()
124 return r()
119 else:
125 else:
120 return pprint(r)
126 return pprint(r)
121
127
122 def binary(s):
128 def binary(s):
123 """return true if a string is binary data"""
129 """return true if a string is binary data"""
124 return bool(s and '\0' in s)
130 return bool(s and '\0' in s)
125
131
126 def stringmatcher(pattern, casesensitive=True):
132 def stringmatcher(pattern, casesensitive=True):
127 """
133 """
128 accepts a string, possibly starting with 're:' or 'literal:' prefix.
134 accepts a string, possibly starting with 're:' or 'literal:' prefix.
129 returns the matcher name, pattern, and matcher function.
135 returns the matcher name, pattern, and matcher function.
130 missing or unknown prefixes are treated as literal matches.
136 missing or unknown prefixes are treated as literal matches.
131
137
132 helper for tests:
138 helper for tests:
133 >>> def test(pattern, *tests):
139 >>> def test(pattern, *tests):
134 ... kind, pattern, matcher = stringmatcher(pattern)
140 ... kind, pattern, matcher = stringmatcher(pattern)
135 ... return (kind, pattern, [bool(matcher(t)) for t in tests])
141 ... return (kind, pattern, [bool(matcher(t)) for t in tests])
136 >>> def itest(pattern, *tests):
142 >>> def itest(pattern, *tests):
137 ... kind, pattern, matcher = stringmatcher(pattern, casesensitive=False)
143 ... kind, pattern, matcher = stringmatcher(pattern, casesensitive=False)
138 ... return (kind, pattern, [bool(matcher(t)) for t in tests])
144 ... return (kind, pattern, [bool(matcher(t)) for t in tests])
139
145
140 exact matching (no prefix):
146 exact matching (no prefix):
141 >>> test(b'abcdefg', b'abc', b'def', b'abcdefg')
147 >>> test(b'abcdefg', b'abc', b'def', b'abcdefg')
142 ('literal', 'abcdefg', [False, False, True])
148 ('literal', 'abcdefg', [False, False, True])
143
149
144 regex matching ('re:' prefix)
150 regex matching ('re:' prefix)
145 >>> test(b're:a.+b', b'nomatch', b'fooadef', b'fooadefbar')
151 >>> test(b're:a.+b', b'nomatch', b'fooadef', b'fooadefbar')
146 ('re', 'a.+b', [False, False, True])
152 ('re', 'a.+b', [False, False, True])
147
153
148 force exact matches ('literal:' prefix)
154 force exact matches ('literal:' prefix)
149 >>> test(b'literal:re:foobar', b'foobar', b're:foobar')
155 >>> test(b'literal:re:foobar', b'foobar', b're:foobar')
150 ('literal', 're:foobar', [False, True])
156 ('literal', 're:foobar', [False, True])
151
157
152 unknown prefixes are ignored and treated as literals
158 unknown prefixes are ignored and treated as literals
153 >>> test(b'foo:bar', b'foo', b'bar', b'foo:bar')
159 >>> test(b'foo:bar', b'foo', b'bar', b'foo:bar')
154 ('literal', 'foo:bar', [False, False, True])
160 ('literal', 'foo:bar', [False, False, True])
155
161
156 case insensitive regex matches
162 case insensitive regex matches
157 >>> itest(b're:A.+b', b'nomatch', b'fooadef', b'fooadefBar')
163 >>> itest(b're:A.+b', b'nomatch', b'fooadef', b'fooadefBar')
158 ('re', 'A.+b', [False, False, True])
164 ('re', 'A.+b', [False, False, True])
159
165
160 case insensitive literal matches
166 case insensitive literal matches
161 >>> itest(b'ABCDEFG', b'abc', b'def', b'abcdefg')
167 >>> itest(b'ABCDEFG', b'abc', b'def', b'abcdefg')
162 ('literal', 'ABCDEFG', [False, False, True])
168 ('literal', 'ABCDEFG', [False, False, True])
163 """
169 """
164 if pattern.startswith('re:'):
170 if pattern.startswith('re:'):
165 pattern = pattern[3:]
171 pattern = pattern[3:]
166 try:
172 try:
167 flags = 0
173 flags = 0
168 if not casesensitive:
174 if not casesensitive:
169 flags = remod.I
175 flags = remod.I
170 regex = remod.compile(pattern, flags)
176 regex = remod.compile(pattern, flags)
171 except remod.error as e:
177 except remod.error as e:
172 raise error.ParseError(_('invalid regular expression: %s')
178 raise error.ParseError(_('invalid regular expression: %s')
173 % e)
179 % e)
174 return 're', pattern, regex.search
180 return 're', pattern, regex.search
175 elif pattern.startswith('literal:'):
181 elif pattern.startswith('literal:'):
176 pattern = pattern[8:]
182 pattern = pattern[8:]
177
183
178 match = pattern.__eq__
184 match = pattern.__eq__
179
185
180 if not casesensitive:
186 if not casesensitive:
181 ipat = encoding.lower(pattern)
187 ipat = encoding.lower(pattern)
182 match = lambda s: ipat == encoding.lower(s)
188 match = lambda s: ipat == encoding.lower(s)
183 return 'literal', pattern, match
189 return 'literal', pattern, match
184
190
185 def shortuser(user):
191 def shortuser(user):
186 """Return a short representation of a user name or email address."""
192 """Return a short representation of a user name or email address."""
187 f = user.find('@')
193 f = user.find('@')
188 if f >= 0:
194 if f >= 0:
189 user = user[:f]
195 user = user[:f]
190 f = user.find('<')
196 f = user.find('<')
191 if f >= 0:
197 if f >= 0:
192 user = user[f + 1:]
198 user = user[f + 1:]
193 f = user.find(' ')
199 f = user.find(' ')
194 if f >= 0:
200 if f >= 0:
195 user = user[:f]
201 user = user[:f]
196 f = user.find('.')
202 f = user.find('.')
197 if f >= 0:
203 if f >= 0:
198 user = user[:f]
204 user = user[:f]
199 return user
205 return user
200
206
201 def emailuser(user):
207 def emailuser(user):
202 """Return the user portion of an email address."""
208 """Return the user portion of an email address."""
203 f = user.find('@')
209 f = user.find('@')
204 if f >= 0:
210 if f >= 0:
205 user = user[:f]
211 user = user[:f]
206 f = user.find('<')
212 f = user.find('<')
207 if f >= 0:
213 if f >= 0:
208 user = user[f + 1:]
214 user = user[f + 1:]
209 return user
215 return user
210
216
211 def email(author):
217 def email(author):
212 '''get email of author.'''
218 '''get email of author.'''
213 r = author.find('>')
219 r = author.find('>')
214 if r == -1:
220 if r == -1:
215 r = None
221 r = None
216 return author[author.find('<') + 1:r]
222 return author[author.find('<') + 1:r]
217
223
218 def person(author):
224 def person(author):
219 """Returns the name before an email address,
225 """Returns the name before an email address,
220 interpreting it as per RFC 5322
226 interpreting it as per RFC 5322
221
227
222 >>> person(b'foo@bar')
228 >>> person(b'foo@bar')
223 'foo'
229 'foo'
224 >>> person(b'Foo Bar <foo@bar>')
230 >>> person(b'Foo Bar <foo@bar>')
225 'Foo Bar'
231 'Foo Bar'
226 >>> person(b'"Foo Bar" <foo@bar>')
232 >>> person(b'"Foo Bar" <foo@bar>')
227 'Foo Bar'
233 'Foo Bar'
228 >>> person(b'"Foo \"buz\" Bar" <foo@bar>')
234 >>> person(b'"Foo \"buz\" Bar" <foo@bar>')
229 'Foo "buz" Bar'
235 'Foo "buz" Bar'
230 >>> # The following are invalid, but do exist in real-life
236 >>> # The following are invalid, but do exist in real-life
231 ...
237 ...
232 >>> person(b'Foo "buz" Bar <foo@bar>')
238 >>> person(b'Foo "buz" Bar <foo@bar>')
233 'Foo "buz" Bar'
239 'Foo "buz" Bar'
234 >>> person(b'"Foo Bar <foo@bar>')
240 >>> person(b'"Foo Bar <foo@bar>')
235 'Foo Bar'
241 'Foo Bar'
236 """
242 """
237 if '@' not in author:
243 if '@' not in author:
238 return author
244 return author
239 f = author.find('<')
245 f = author.find('<')
240 if f != -1:
246 if f != -1:
241 return author[:f].strip(' "').replace('\\"', '"')
247 return author[:f].strip(' "').replace('\\"', '"')
242 f = author.find('@')
248 f = author.find('@')
243 return author[:f].replace('.', ' ')
249 return author[:f].replace('.', ' ')
244
250
245 @attr.s(hash=True)
251 @attr.s(hash=True)
246 class mailmapping(object):
252 class mailmapping(object):
247 '''Represents a username/email key or value in
253 '''Represents a username/email key or value in
248 a mailmap file'''
254 a mailmap file'''
249 email = attr.ib()
255 email = attr.ib()
250 name = attr.ib(default=None)
256 name = attr.ib(default=None)
251
257
252 def _ismailmaplineinvalid(names, emails):
258 def _ismailmaplineinvalid(names, emails):
253 '''Returns True if the parsed names and emails
259 '''Returns True if the parsed names and emails
254 in a mailmap entry are invalid.
260 in a mailmap entry are invalid.
255
261
256 >>> # No names or emails fails
262 >>> # No names or emails fails
257 >>> names, emails = [], []
263 >>> names, emails = [], []
258 >>> _ismailmaplineinvalid(names, emails)
264 >>> _ismailmaplineinvalid(names, emails)
259 True
265 True
260 >>> # Only one email fails
266 >>> # Only one email fails
261 >>> emails = [b'email@email.com']
267 >>> emails = [b'email@email.com']
262 >>> _ismailmaplineinvalid(names, emails)
268 >>> _ismailmaplineinvalid(names, emails)
263 True
269 True
264 >>> # One email and one name passes
270 >>> # One email and one name passes
265 >>> names = [b'Test Name']
271 >>> names = [b'Test Name']
266 >>> _ismailmaplineinvalid(names, emails)
272 >>> _ismailmaplineinvalid(names, emails)
267 False
273 False
268 >>> # No names but two emails passes
274 >>> # No names but two emails passes
269 >>> names = []
275 >>> names = []
270 >>> emails = [b'proper@email.com', b'commit@email.com']
276 >>> emails = [b'proper@email.com', b'commit@email.com']
271 >>> _ismailmaplineinvalid(names, emails)
277 >>> _ismailmaplineinvalid(names, emails)
272 False
278 False
273 '''
279 '''
274 return not emails or not names and len(emails) < 2
280 return not emails or not names and len(emails) < 2
275
281
276 def parsemailmap(mailmapcontent):
282 def parsemailmap(mailmapcontent):
277 """Parses data in the .mailmap format
283 """Parses data in the .mailmap format
278
284
279 >>> mmdata = b"\\n".join([
285 >>> mmdata = b"\\n".join([
280 ... b'# Comment',
286 ... b'# Comment',
281 ... b'Name <commit1@email.xx>',
287 ... b'Name <commit1@email.xx>',
282 ... b'<name@email.xx> <commit2@email.xx>',
288 ... b'<name@email.xx> <commit2@email.xx>',
283 ... b'Name <proper@email.xx> <commit3@email.xx>',
289 ... b'Name <proper@email.xx> <commit3@email.xx>',
284 ... b'Name <proper@email.xx> Commit <commit4@email.xx>',
290 ... b'Name <proper@email.xx> Commit <commit4@email.xx>',
285 ... ])
291 ... ])
286 >>> mm = parsemailmap(mmdata)
292 >>> mm = parsemailmap(mmdata)
287 >>> for key in sorted(mm.keys()):
293 >>> for key in sorted(mm.keys()):
288 ... print(key)
294 ... print(key)
289 mailmapping(email='commit1@email.xx', name=None)
295 mailmapping(email='commit1@email.xx', name=None)
290 mailmapping(email='commit2@email.xx', name=None)
296 mailmapping(email='commit2@email.xx', name=None)
291 mailmapping(email='commit3@email.xx', name=None)
297 mailmapping(email='commit3@email.xx', name=None)
292 mailmapping(email='commit4@email.xx', name='Commit')
298 mailmapping(email='commit4@email.xx', name='Commit')
293 >>> for val in sorted(mm.values()):
299 >>> for val in sorted(mm.values()):
294 ... print(val)
300 ... print(val)
295 mailmapping(email='commit1@email.xx', name='Name')
301 mailmapping(email='commit1@email.xx', name='Name')
296 mailmapping(email='name@email.xx', name=None)
302 mailmapping(email='name@email.xx', name=None)
297 mailmapping(email='proper@email.xx', name='Name')
303 mailmapping(email='proper@email.xx', name='Name')
298 mailmapping(email='proper@email.xx', name='Name')
304 mailmapping(email='proper@email.xx', name='Name')
299 """
305 """
300 mailmap = {}
306 mailmap = {}
301
307
302 if mailmapcontent is None:
308 if mailmapcontent is None:
303 return mailmap
309 return mailmap
304
310
305 for line in mailmapcontent.splitlines():
311 for line in mailmapcontent.splitlines():
306
312
307 # Don't bother checking the line if it is a comment or
313 # Don't bother checking the line if it is a comment or
308 # is an improperly formed author field
314 # is an improperly formed author field
309 if line.lstrip().startswith('#'):
315 if line.lstrip().startswith('#'):
310 continue
316 continue
311
317
312 # names, emails hold the parsed emails and names for each line
318 # names, emails hold the parsed emails and names for each line
313 # name_builder holds the words in a persons name
319 # name_builder holds the words in a persons name
314 names, emails = [], []
320 names, emails = [], []
315 namebuilder = []
321 namebuilder = []
316
322
317 for element in line.split():
323 for element in line.split():
318 if element.startswith('#'):
324 if element.startswith('#'):
319 # If we reach a comment in the mailmap file, move on
325 # If we reach a comment in the mailmap file, move on
320 break
326 break
321
327
322 elif element.startswith('<') and element.endswith('>'):
328 elif element.startswith('<') and element.endswith('>'):
323 # We have found an email.
329 # We have found an email.
324 # Parse it, and finalize any names from earlier
330 # Parse it, and finalize any names from earlier
325 emails.append(element[1:-1]) # Slice off the "<>"
331 emails.append(element[1:-1]) # Slice off the "<>"
326
332
327 if namebuilder:
333 if namebuilder:
328 names.append(' '.join(namebuilder))
334 names.append(' '.join(namebuilder))
329 namebuilder = []
335 namebuilder = []
330
336
331 # Break if we have found a second email, any other
337 # Break if we have found a second email, any other
332 # data does not fit the spec for .mailmap
338 # data does not fit the spec for .mailmap
333 if len(emails) > 1:
339 if len(emails) > 1:
334 break
340 break
335
341
336 else:
342 else:
337 # We have found another word in the committers name
343 # We have found another word in the committers name
338 namebuilder.append(element)
344 namebuilder.append(element)
339
345
340 # Check to see if we have parsed the line into a valid form
346 # Check to see if we have parsed the line into a valid form
341 # We require at least one email, and either at least one
347 # We require at least one email, and either at least one
342 # name or a second email
348 # name or a second email
343 if _ismailmaplineinvalid(names, emails):
349 if _ismailmaplineinvalid(names, emails):
344 continue
350 continue
345
351
346 mailmapkey = mailmapping(
352 mailmapkey = mailmapping(
347 email=emails[-1],
353 email=emails[-1],
348 name=names[-1] if len(names) == 2 else None,
354 name=names[-1] if len(names) == 2 else None,
349 )
355 )
350
356
351 mailmap[mailmapkey] = mailmapping(
357 mailmap[mailmapkey] = mailmapping(
352 email=emails[0],
358 email=emails[0],
353 name=names[0] if names else None,
359 name=names[0] if names else None,
354 )
360 )
355
361
356 return mailmap
362 return mailmap
357
363
358 def mapname(mailmap, author):
364 def mapname(mailmap, author):
359 """Returns the author field according to the mailmap cache, or
365 """Returns the author field according to the mailmap cache, or
360 the original author field.
366 the original author field.
361
367
362 >>> mmdata = b"\\n".join([
368 >>> mmdata = b"\\n".join([
363 ... b'# Comment',
369 ... b'# Comment',
364 ... b'Name <commit1@email.xx>',
370 ... b'Name <commit1@email.xx>',
365 ... b'<name@email.xx> <commit2@email.xx>',
371 ... b'<name@email.xx> <commit2@email.xx>',
366 ... b'Name <proper@email.xx> <commit3@email.xx>',
372 ... b'Name <proper@email.xx> <commit3@email.xx>',
367 ... b'Name <proper@email.xx> Commit <commit4@email.xx>',
373 ... b'Name <proper@email.xx> Commit <commit4@email.xx>',
368 ... ])
374 ... ])
369 >>> m = parsemailmap(mmdata)
375 >>> m = parsemailmap(mmdata)
370 >>> mapname(m, b'Commit <commit1@email.xx>')
376 >>> mapname(m, b'Commit <commit1@email.xx>')
371 'Name <commit1@email.xx>'
377 'Name <commit1@email.xx>'
372 >>> mapname(m, b'Name <commit2@email.xx>')
378 >>> mapname(m, b'Name <commit2@email.xx>')
373 'Name <name@email.xx>'
379 'Name <name@email.xx>'
374 >>> mapname(m, b'Commit <commit3@email.xx>')
380 >>> mapname(m, b'Commit <commit3@email.xx>')
375 'Name <proper@email.xx>'
381 'Name <proper@email.xx>'
376 >>> mapname(m, b'Commit <commit4@email.xx>')
382 >>> mapname(m, b'Commit <commit4@email.xx>')
377 'Name <proper@email.xx>'
383 'Name <proper@email.xx>'
378 >>> mapname(m, b'Unknown Name <unknown@email.com>')
384 >>> mapname(m, b'Unknown Name <unknown@email.com>')
379 'Unknown Name <unknown@email.com>'
385 'Unknown Name <unknown@email.com>'
380 """
386 """
381 # If the author field coming in isn't in the correct format,
387 # If the author field coming in isn't in the correct format,
382 # or the mailmap is empty just return the original author field
388 # or the mailmap is empty just return the original author field
383 if not isauthorwellformed(author) or not mailmap:
389 if not isauthorwellformed(author) or not mailmap:
384 return author
390 return author
385
391
386 # Turn the user name into a mailmapping
392 # Turn the user name into a mailmapping
387 commit = mailmapping(name=person(author), email=email(author))
393 commit = mailmapping(name=person(author), email=email(author))
388
394
389 try:
395 try:
390 # Try and use both the commit email and name as the key
396 # Try and use both the commit email and name as the key
391 proper = mailmap[commit]
397 proper = mailmap[commit]
392
398
393 except KeyError:
399 except KeyError:
394 # If the lookup fails, use just the email as the key instead
400 # If the lookup fails, use just the email as the key instead
395 # We call this commit2 as not to erase original commit fields
401 # We call this commit2 as not to erase original commit fields
396 commit2 = mailmapping(email=commit.email)
402 commit2 = mailmapping(email=commit.email)
397 proper = mailmap.get(commit2, mailmapping(None, None))
403 proper = mailmap.get(commit2, mailmapping(None, None))
398
404
399 # Return the author field with proper values filled in
405 # Return the author field with proper values filled in
400 return '%s <%s>' % (
406 return '%s <%s>' % (
401 proper.name if proper.name else commit.name,
407 proper.name if proper.name else commit.name,
402 proper.email if proper.email else commit.email,
408 proper.email if proper.email else commit.email,
403 )
409 )
404
410
405 _correctauthorformat = remod.compile(br'^[^<]+\s\<[^<>]+@[^<>]+\>$')
411 _correctauthorformat = remod.compile(br'^[^<]+\s\<[^<>]+@[^<>]+\>$')
406
412
407 def isauthorwellformed(author):
413 def isauthorwellformed(author):
408 '''Return True if the author field is well formed
414 '''Return True if the author field is well formed
409 (ie "Contributor Name <contrib@email.dom>")
415 (ie "Contributor Name <contrib@email.dom>")
410
416
411 >>> isauthorwellformed(b'Good Author <good@author.com>')
417 >>> isauthorwellformed(b'Good Author <good@author.com>')
412 True
418 True
413 >>> isauthorwellformed(b'Author <good@author.com>')
419 >>> isauthorwellformed(b'Author <good@author.com>')
414 True
420 True
415 >>> isauthorwellformed(b'Bad Author')
421 >>> isauthorwellformed(b'Bad Author')
416 False
422 False
417 >>> isauthorwellformed(b'Bad Author <author@author.com')
423 >>> isauthorwellformed(b'Bad Author <author@author.com')
418 False
424 False
419 >>> isauthorwellformed(b'Bad Author author@author.com')
425 >>> isauthorwellformed(b'Bad Author author@author.com')
420 False
426 False
421 >>> isauthorwellformed(b'<author@author.com>')
427 >>> isauthorwellformed(b'<author@author.com>')
422 False
428 False
423 >>> isauthorwellformed(b'Bad Author <author>')
429 >>> isauthorwellformed(b'Bad Author <author>')
424 False
430 False
425 '''
431 '''
426 return _correctauthorformat.match(author) is not None
432 return _correctauthorformat.match(author) is not None
427
433
428 def ellipsis(text, maxlength=400):
434 def ellipsis(text, maxlength=400):
429 """Trim string to at most maxlength (default: 400) columns in display."""
435 """Trim string to at most maxlength (default: 400) columns in display."""
430 return encoding.trim(text, maxlength, ellipsis='...')
436 return encoding.trim(text, maxlength, ellipsis='...')
431
437
432 def escapestr(s):
438 def escapestr(s):
433 if isinstance(s, memoryview):
439 if isinstance(s, memoryview):
434 s = bytes(s)
440 s = bytes(s)
435 # call underlying function of s.encode('string_escape') directly for
441 # call underlying function of s.encode('string_escape') directly for
436 # Python 3 compatibility
442 # Python 3 compatibility
437 return codecs.escape_encode(s)[0]
443 return codecs.escape_encode(s)[0]
438
444
439 def unescapestr(s):
445 def unescapestr(s):
440 return codecs.escape_decode(s)[0]
446 return codecs.escape_decode(s)[0]
441
447
442 def forcebytestr(obj):
448 def forcebytestr(obj):
443 """Portably format an arbitrary object (e.g. exception) into a byte
449 """Portably format an arbitrary object (e.g. exception) into a byte
444 string."""
450 string."""
445 try:
451 try:
446 return pycompat.bytestr(obj)
452 return pycompat.bytestr(obj)
447 except UnicodeEncodeError:
453 except UnicodeEncodeError:
448 # non-ascii string, may be lossy
454 # non-ascii string, may be lossy
449 return pycompat.bytestr(encoding.strtolocal(str(obj)))
455 return pycompat.bytestr(encoding.strtolocal(str(obj)))
450
456
451 def uirepr(s):
457 def uirepr(s):
452 # Avoid double backslash in Windows path repr()
458 # Avoid double backslash in Windows path repr()
453 return pycompat.byterepr(pycompat.bytestr(s)).replace(b'\\\\', b'\\')
459 return pycompat.byterepr(pycompat.bytestr(s)).replace(b'\\\\', b'\\')
454
460
455 # delay import of textwrap
461 # delay import of textwrap
456 def _MBTextWrapper(**kwargs):
462 def _MBTextWrapper(**kwargs):
457 class tw(textwrap.TextWrapper):
463 class tw(textwrap.TextWrapper):
458 """
464 """
459 Extend TextWrapper for width-awareness.
465 Extend TextWrapper for width-awareness.
460
466
461 Neither number of 'bytes' in any encoding nor 'characters' is
467 Neither number of 'bytes' in any encoding nor 'characters' is
462 appropriate to calculate terminal columns for specified string.
468 appropriate to calculate terminal columns for specified string.
463
469
464 Original TextWrapper implementation uses built-in 'len()' directly,
470 Original TextWrapper implementation uses built-in 'len()' directly,
465 so overriding is needed to use width information of each characters.
471 so overriding is needed to use width information of each characters.
466
472
467 In addition, characters classified into 'ambiguous' width are
473 In addition, characters classified into 'ambiguous' width are
468 treated as wide in East Asian area, but as narrow in other.
474 treated as wide in East Asian area, but as narrow in other.
469
475
470 This requires use decision to determine width of such characters.
476 This requires use decision to determine width of such characters.
471 """
477 """
472 def _cutdown(self, ucstr, space_left):
478 def _cutdown(self, ucstr, space_left):
473 l = 0
479 l = 0
474 colwidth = encoding.ucolwidth
480 colwidth = encoding.ucolwidth
475 for i in pycompat.xrange(len(ucstr)):
481 for i in pycompat.xrange(len(ucstr)):
476 l += colwidth(ucstr[i])
482 l += colwidth(ucstr[i])
477 if space_left < l:
483 if space_left < l:
478 return (ucstr[:i], ucstr[i:])
484 return (ucstr[:i], ucstr[i:])
479 return ucstr, ''
485 return ucstr, ''
480
486
481 # overriding of base class
487 # overriding of base class
482 def _handle_long_word(self, reversed_chunks, cur_line, cur_len, width):
488 def _handle_long_word(self, reversed_chunks, cur_line, cur_len, width):
483 space_left = max(width - cur_len, 1)
489 space_left = max(width - cur_len, 1)
484
490
485 if self.break_long_words:
491 if self.break_long_words:
486 cut, res = self._cutdown(reversed_chunks[-1], space_left)
492 cut, res = self._cutdown(reversed_chunks[-1], space_left)
487 cur_line.append(cut)
493 cur_line.append(cut)
488 reversed_chunks[-1] = res
494 reversed_chunks[-1] = res
489 elif not cur_line:
495 elif not cur_line:
490 cur_line.append(reversed_chunks.pop())
496 cur_line.append(reversed_chunks.pop())
491
497
492 # this overriding code is imported from TextWrapper of Python 2.6
498 # this overriding code is imported from TextWrapper of Python 2.6
493 # to calculate columns of string by 'encoding.ucolwidth()'
499 # to calculate columns of string by 'encoding.ucolwidth()'
494 def _wrap_chunks(self, chunks):
500 def _wrap_chunks(self, chunks):
495 colwidth = encoding.ucolwidth
501 colwidth = encoding.ucolwidth
496
502
497 lines = []
503 lines = []
498 if self.width <= 0:
504 if self.width <= 0:
499 raise ValueError("invalid width %r (must be > 0)" % self.width)
505 raise ValueError("invalid width %r (must be > 0)" % self.width)
500
506
501 # Arrange in reverse order so items can be efficiently popped
507 # Arrange in reverse order so items can be efficiently popped
502 # from a stack of chucks.
508 # from a stack of chucks.
503 chunks.reverse()
509 chunks.reverse()
504
510
505 while chunks:
511 while chunks:
506
512
507 # Start the list of chunks that will make up the current line.
513 # Start the list of chunks that will make up the current line.
508 # cur_len is just the length of all the chunks in cur_line.
514 # cur_len is just the length of all the chunks in cur_line.
509 cur_line = []
515 cur_line = []
510 cur_len = 0
516 cur_len = 0
511
517
512 # Figure out which static string will prefix this line.
518 # Figure out which static string will prefix this line.
513 if lines:
519 if lines:
514 indent = self.subsequent_indent
520 indent = self.subsequent_indent
515 else:
521 else:
516 indent = self.initial_indent
522 indent = self.initial_indent
517
523
518 # Maximum width for this line.
524 # Maximum width for this line.
519 width = self.width - len(indent)
525 width = self.width - len(indent)
520
526
521 # First chunk on line is whitespace -- drop it, unless this
527 # First chunk on line is whitespace -- drop it, unless this
522 # is the very beginning of the text (i.e. no lines started yet).
528 # is the very beginning of the text (i.e. no lines started yet).
523 if self.drop_whitespace and chunks[-1].strip() == r'' and lines:
529 if self.drop_whitespace and chunks[-1].strip() == r'' and lines:
524 del chunks[-1]
530 del chunks[-1]
525
531
526 while chunks:
532 while chunks:
527 l = colwidth(chunks[-1])
533 l = colwidth(chunks[-1])
528
534
529 # Can at least squeeze this chunk onto the current line.
535 # Can at least squeeze this chunk onto the current line.
530 if cur_len + l <= width:
536 if cur_len + l <= width:
531 cur_line.append(chunks.pop())
537 cur_line.append(chunks.pop())
532 cur_len += l
538 cur_len += l
533
539
534 # Nope, this line is full.
540 # Nope, this line is full.
535 else:
541 else:
536 break
542 break
537
543
538 # The current line is full, and the next chunk is too big to
544 # The current line is full, and the next chunk is too big to
539 # fit on *any* line (not just this one).
545 # fit on *any* line (not just this one).
540 if chunks and colwidth(chunks[-1]) > width:
546 if chunks and colwidth(chunks[-1]) > width:
541 self._handle_long_word(chunks, cur_line, cur_len, width)
547 self._handle_long_word(chunks, cur_line, cur_len, width)
542
548
543 # If the last chunk on this line is all whitespace, drop it.
549 # If the last chunk on this line is all whitespace, drop it.
544 if (self.drop_whitespace and
550 if (self.drop_whitespace and
545 cur_line and cur_line[-1].strip() == r''):
551 cur_line and cur_line[-1].strip() == r''):
546 del cur_line[-1]
552 del cur_line[-1]
547
553
548 # Convert current line back to a string and store it in list
554 # Convert current line back to a string and store it in list
549 # of all lines (return value).
555 # of all lines (return value).
550 if cur_line:
556 if cur_line:
551 lines.append(indent + r''.join(cur_line))
557 lines.append(indent + r''.join(cur_line))
552
558
553 return lines
559 return lines
554
560
555 global _MBTextWrapper
561 global _MBTextWrapper
556 _MBTextWrapper = tw
562 _MBTextWrapper = tw
557 return tw(**kwargs)
563 return tw(**kwargs)
558
564
559 def wrap(line, width, initindent='', hangindent=''):
565 def wrap(line, width, initindent='', hangindent=''):
560 maxindent = max(len(hangindent), len(initindent))
566 maxindent = max(len(hangindent), len(initindent))
561 if width <= maxindent:
567 if width <= maxindent:
562 # adjust for weird terminal size
568 # adjust for weird terminal size
563 width = max(78, maxindent + 1)
569 width = max(78, maxindent + 1)
564 line = line.decode(pycompat.sysstr(encoding.encoding),
570 line = line.decode(pycompat.sysstr(encoding.encoding),
565 pycompat.sysstr(encoding.encodingmode))
571 pycompat.sysstr(encoding.encodingmode))
566 initindent = initindent.decode(pycompat.sysstr(encoding.encoding),
572 initindent = initindent.decode(pycompat.sysstr(encoding.encoding),
567 pycompat.sysstr(encoding.encodingmode))
573 pycompat.sysstr(encoding.encodingmode))
568 hangindent = hangindent.decode(pycompat.sysstr(encoding.encoding),
574 hangindent = hangindent.decode(pycompat.sysstr(encoding.encoding),
569 pycompat.sysstr(encoding.encodingmode))
575 pycompat.sysstr(encoding.encodingmode))
570 wrapper = _MBTextWrapper(width=width,
576 wrapper = _MBTextWrapper(width=width,
571 initial_indent=initindent,
577 initial_indent=initindent,
572 subsequent_indent=hangindent)
578 subsequent_indent=hangindent)
573 return wrapper.fill(line).encode(pycompat.sysstr(encoding.encoding))
579 return wrapper.fill(line).encode(pycompat.sysstr(encoding.encoding))
574
580
575 _booleans = {'1': True, 'yes': True, 'true': True, 'on': True, 'always': True,
581 _booleans = {'1': True, 'yes': True, 'true': True, 'on': True, 'always': True,
576 '0': False, 'no': False, 'false': False, 'off': False,
582 '0': False, 'no': False, 'false': False, 'off': False,
577 'never': False}
583 'never': False}
578
584
579 def parsebool(s):
585 def parsebool(s):
580 """Parse s into a boolean.
586 """Parse s into a boolean.
581
587
582 If s is not a valid boolean, returns None.
588 If s is not a valid boolean, returns None.
583 """
589 """
584 return _booleans.get(s.lower(), None)
590 return _booleans.get(s.lower(), None)
585
591
586 def evalpythonliteral(s):
592 def evalpythonliteral(s):
587 """Evaluate a string containing a Python literal expression"""
593 """Evaluate a string containing a Python literal expression"""
588 # We could backport our tokenizer hack to rewrite '' to u'' if we want
594 # We could backport our tokenizer hack to rewrite '' to u'' if we want
589 if pycompat.ispy3:
595 if pycompat.ispy3:
590 return ast.literal_eval(s.decode('latin1'))
596 return ast.literal_eval(s.decode('latin1'))
591 return ast.literal_eval(s)
597 return ast.literal_eval(s)
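
As the commit summary says, the point of emitting chunks is that callers can stream the pretty-printed output instead of materializing one large string. Note that in this revision the nested values are still joined eagerly inside each yield (the list and dict branches still call pprint() on their elements); the generator form is what allows later changes to make emission more incremental. A hypothetical consumer of a pprintgen-style generator might look like this (illustrative only, not code from this commit):

    import sys

    def writepretty(out, chunks):
        # Stream pretty-printer chunks to a file-like object as they are
        # produced, instead of joining them into one large string first.
        for chunk in chunks:
            out.write(chunk)
        out.write('\n')

    # With a pprintgen-style generator this becomes, e.g.:
    #     writepretty(sys.stdout, pprintgen(obj))
    writepretty(sys.stdout, iter(["{'key': ", "[1, 2]", "}"]))
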