upstream/mercurial-mirror Commit - r37388:b6de372b

1

# mdiff.py - diff and patch routines for mercurial

1

# mdiff.py - diff and patch routines for mercurial

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

from __future__ import absolute_import

8

from __future__ import absolute_import

9

10

import re

10

import re

11

import struct

11

import struct

12

import zlib

12

import zlib

13

14

from .i18n import _

14

from .i18n import _

15

from . import (

15

from . import (

16

encoding,

16

encoding,

17

error,

17

error,

18

policy,

18

policy,

19

pycompat,

19

pycompat,

20

util,

20

util,

21

)

21

)

22

from .utils import dateutil

22

from .utils import dateutil

23

24

# Marker line emitted after the last line of a hunk when the corresponding
# file does not end with a newline.
_missing_newline_marker = "\\ No newline at end of file\n"

# Implementation modules are resolved through the module policy.
bdiff = policy.importmod(r'bdiff')
mpatch = policy.importmod(r'mpatch')

# Re-export the low-level primitives under the names used by this module.
blocks = bdiff.blocks
fixws = bdiff.fixws
patches = mpatch.patches
patchedsize = mpatch.patchedsize
textdiff = bdiff.bdiff
splitnewlines = bdiff.splitnewlines

35

36

class diffopts(object):
    '''context is the number of context lines
    text treats all files as text
    showfunc enables diff -p output
    git enables the git extended patch format
    nodates removes dates from diff headers
    nobinary ignores binary files
    noprefix disables the 'a/' and 'b/' prefixes (ignored in plain mode)
    ignorews ignores all whitespace changes in the diff
    ignorewsamount ignores changes in the amount of whitespace
    ignorewseol ignores whitespace changes at the end of lines
    ignoreblanklines ignores changes whose lines are all blank
    upgrade generates git diffs to avoid data loss
    xdiff selects bdiff.xdiffblocks as the block matcher when available
    '''

    # Every supported option with its default value. The remaining keys
    # (index, showsimilarity, worddiff) are not read in this module.
    defaults = {
        'context': 3,
        'text': False,
        'showfunc': False,
        'git': False,
        'nodates': False,
        'nobinary': False,
        'noprefix': False,
        'index': 0,
        'ignorews': False,
        'ignorewsamount': False,
        'ignorewseol': False,
        'ignoreblanklines': False,
        'upgrade': False,
        'showsimilarity': False,
        'worddiff': False,
        'xdiff': False,
    }

    def __init__(self, **opts):
        """Set one attribute per key of `defaults`.

        An option that is missing from `opts`, or passed as None, takes its
        default value. `context` is coerced to an int; error.Abort is raised
        if the conversion fails with ValueError.
        """
        opts = pycompat.byteskwargs(opts)
        for k in self.defaults:
            v = opts.get(k)
            if v is None:
                v = self.defaults[k]
            setattr(self, k, v)

        try:
            self.context = int(self.context)
        except ValueError:
            raise error.Abort(_('diff context lines count must be '
                                'an integer, not %r') %
                              pycompat.bytestr(self.context))

    def copy(self, **kwargs):
        """Return a new diffopts with the same values, overridden by kwargs."""
        opts = dict((k, getattr(self, k)) for k in self.defaults)
        opts = pycompat.strkwargs(opts)
        opts.update(kwargs)
        return diffopts(**opts)

88

89

# Shared option set with every default value, used when callers pass no opts.
defaultopts = diffopts()

90

91

def wsclean(opts, text, blank=True):
    """Return `text` normalized according to the whitespace options in `opts`.

    opts.ignorews / opts.ignorewsamount: delegate to bdiff.fixws (mode 1 and
    mode 0 respectively; ignorews takes precedence).
    opts.ignoreblanklines: when `blank` is true, collapse runs of newlines
    into one and strip leading/trailing newlines.
    opts.ignorewseol: drop spaces, tabs, carriage returns and form feeds
    that directly precede a newline.
    """
    if opts.ignorews:
        text = bdiff.fixws(text, 1)
    elif opts.ignorewsamount:
        text = bdiff.fixws(text, 0)
    if blank and opts.ignoreblanklines:
        text = re.sub('\n+', '\n', text).strip('\n')
    if opts.ignorewseol:
        # pattern and replacement must both be bytes: mixing a bytes pattern
        # with a str replacement raises TypeError on Python 3
        text = re.sub(br'[ \t\r\f]+\n', br'\n', text)
    return text

101

102

def splitblock(base1, lines1, base2, lines2, opts):
    """Yield ([a1, a2, b1, b2], btype) sub-blocks of two matching line lists.

    The input lines must match except for interwoven blank lines. They are
    transformed into a sequence of matching blocks (btype '=') and blank
    blocks (btype '~'). `base1` and `base2` are added to the yielded indices
    of the first and second side respectively.
    """
    # 1 for a line that is non-empty after whitespace cleaning, 0 otherwise
    lines1 = [1 if wsclean(opts, l) else 0 for l in lines1]
    lines2 = [1 if wsclean(opts, l) else 0 for l in lines2]
    s1, e1 = 0, len(lines1)
    s2, e2 = 0, len(lines2)
    while s1 < e1 or s2 < e2:
        i1, i2, btype = s1, s2, '='
        if (i1 >= e1 or lines1[i1] == 0
            or i2 >= e2 or lines2[i2] == 0):
            # Consume the block of blank lines
            btype = '~'
            while i1 < e1 and lines1[i1] == 0:
                i1 += 1
            while i2 < e2 and lines2[i2] == 0:
                i2 += 1
        else:
            # Consume the matching lines
            while i1 < e1 and lines1[i1] == 1 and lines2[i2] == 1:
                i1 += 1
                i2 += 1
        yield [base1 + s1, base1 + i1, base2 + s2, base2 + i2], btype
        s1 = i1
        s2 = i2

127

128

def hunkinrange(hunk, linerange):
    """Return True if `hunk` defined as (start, length) is in `linerange`
    defined as (lowerbound, upperbound).

    The hunk covers [start, start + length) and is "in" the range when the
    two half-open intervals overlap.

    >>> hunkinrange((5, 10), (2, 7))
    True
    >>> hunkinrange((5, 10), (6, 12))
    True
    >>> hunkinrange((5, 10), (13, 17))
    True
    >>> hunkinrange((5, 10), (3, 17))
    True
    >>> hunkinrange((5, 10), (1, 3))
    False
    >>> hunkinrange((5, 10), (18, 20))
    False
    >>> hunkinrange((5, 10), (1, 5))
    False
    >>> hunkinrange((5, 10), (15, 27))
    False
    """
    start, length = hunk
    lowerbound, upperbound = linerange
    return lowerbound < start + length and start < upperbound

152

153

def blocksinrange(blocks, rangeb):
    """filter `blocks` like (a1, a2, b1, b2) from items outside line range
    `rangeb` from ``(b1, b2)`` point of view.

    Return `filteredblocks, rangea` where:

    * `filteredblocks` is list of ``block = (a1, a2, b1, b2), stype`` items of
      `blocks` that are inside `rangeb` from ``(b1, b2)`` point of view; a
      block ``(b1, b2)`` being inside `rangeb` if
      ``rangeb[0] < b2 and b1 < rangeb[1]``;
    * `rangea` is the line range w.r.t. ``(a1, a2)`` parts of `blocks`.

    Raise error.Abort if no lower or upper bound could be derived on the
    ``a`` side, or if the derived upper bound is below the lower bound.
    """
    lbb, ubb = rangeb
    lba, uba = None, None
    filteredblocks = []
    for block in blocks:
        (a1, a2, b1, b2), stype = block
        if lbb >= b1 and ubb <= b2 and stype == '=':
            # rangeb is within a single "=" hunk, restrict back linerange1
            # by offsetting rangeb
            lba = lbb - b1 + a1
            uba = ubb - b1 + a1
        else:
            if b1 <= lbb < b2:
                # the lower bound falls in this block: map it exactly for a
                # matching block, otherwise snap to the start of the block
                if stype == '=':
                    lba = a2 - (b2 - lbb)
                else:
                    lba = a1
            if b1 < ubb <= b2:
                # same for the upper bound, snapping to the end of the block
                if stype == '=':
                    uba = a1 + (ubb - b1)
                else:
                    uba = a2
        if hunkinrange((b1, (b2 - b1)), rangeb):
            filteredblocks.append(block)
    if lba is None or uba is None or uba < lba:
        raise error.Abort(_('line range exceeds file size'))
    return filteredblocks, (lba, uba)

191

192

def chooseblocksfunc(opts=None):
    """Return the function used to compute matching blocks.

    bdiff.xdiffblocks is returned only when `opts` is given, `opts.xdiff`
    is set and the loaded bdiff module provides `xdiffblocks`; otherwise
    bdiff.blocks is returned.
    """
    if (opts is None or not opts.xdiff
        or not util.safehasattr(bdiff, 'xdiffblocks')):
        return bdiff.blocks
    else:
        return bdiff.xdiffblocks

198

199

def allblocks(text1, text2, opts=None, lines1=None, lines2=None):
    """Return (block, type) tuples, where block is an mdiff.blocks
    line entry. type is '=' for blocks matching exactly one another
    (bdiff blocks), '!' for non-matching blocks and '~' for blocks
    matching only after having filtered blank lines.
    lines1 and lines2 are text1 and text2 split with splitnewlines() if
    they are already available.
    """
    if opts is None:
        opts = defaultopts
    if opts.ignorews or opts.ignorewsamount or opts.ignorewseol:
        # blank-line filtering is handled per block below, not here
        text1 = wsclean(opts, text1, False)
        text2 = wsclean(opts, text2, False)
    diff = chooseblocksfunc(opts)(text1, text2)
    for i, s1 in enumerate(diff):
        # The first match is special.
        # we've either found a match starting at line 0 or a match later
        # in the file.  If it starts later, old and new below will both be
        # empty and we'll continue to the next match.
        if i > 0:
            s = diff[i - 1]
        else:
            s = [0, 0, 0, 0]
        # the gap between the end of the previous match and the start of
        # the current one
        s = [s[1], s1[0], s[3], s1[2]]

        # bdiff sometimes gives huge matches past eof, this check eats them,
        # and deals with the special first match case described above
        if s[0] != s[1] or s[2] != s[3]:
            btype = '!'
            if opts.ignoreblanklines:
                if lines1 is None:
                    lines1 = splitnewlines(text1)
                if lines2 is None:
                    lines2 = splitnewlines(text2)
                old = wsclean(opts, "".join(lines1[s[0]:s[1]]))
                new = wsclean(opts, "".join(lines2[s[2]:s[3]]))
                if old == new:
                    btype = '~'
            yield s, btype
        yield s1, '='

239

240

def unidiff(a, ad, b, bd, fn1, fn2, binary, opts=defaultopts):
    """Return a unified diff as a (headers, hunks) tuple.

    If the diff is not null, `headers` is a list with unified diff header
    lines "--- <original>" and "+++ <new>" and `hunks` is a generator yielding
    (hunkrange, hunklines) coming from _unidiff().
    Otherwise, `headers` and `hunks` are empty.

    `a` and `b` are the old and new contents (None selects the /dev/null
    header for that side), `ad` and `bd` their dates, `fn1` and `fn2` their
    file names.

    Set binary=True if either a or b should be taken as a binary file.
    """
    def datetag(date, fn=None):
        # dates are shown unless git mode or nodates is set; without a date,
        # a file name containing a space still gets a trailing tab
        if not opts.git and not opts.nodates:
            return '\t%s' % date
        if fn and ' ' in fn:
            return '\t'
        return ''

    sentinel = [], ()
    if not a and not b:
        return sentinel

    if opts.noprefix:
        aprefix = bprefix = ''
    else:
        aprefix = 'a/'
        bprefix = 'b/'

    epoch = dateutil.datestr((0, 0))

    fn1 = util.pconvert(fn1)
    fn2 = util.pconvert(fn2)

    if binary:
        if a and b and len(a) == len(b) and a == b:
            return sentinel
        headerlines = []
        hunks = ((None, ['Binary file %s has changed\n' % fn1]),)
    elif not a:
        # old side is empty or missing: everything in b is an addition
        without_newline = not b.endswith('\n')
        b = splitnewlines(b)
        if a is None:
            l1 = '--- /dev/null%s' % datetag(epoch)
        else:
            l1 = "--- %s%s%s" % (aprefix, fn1, datetag(ad, fn1))
        l2 = "+++ %s%s" % (bprefix + fn2, datetag(bd, fn2))
        headerlines = [l1, l2]
        size = len(b)
        hunkrange = (0, 0, 1, size)
        hunklines = ["@@ -0,0 +1,%d @@\n" % size] + ["+" + e for e in b]
        if without_newline:
            hunklines[-1] += '\n'
            hunklines.append(_missing_newline_marker)
        hunks = ((hunkrange, hunklines),)
    elif not b:
        # new side is empty or missing: everything in a is a removal
        without_newline = not a.endswith('\n')
        a = splitnewlines(a)
        l1 = "--- %s%s%s" % (aprefix, fn1, datetag(ad, fn1))
        if b is None:
            l2 = '+++ /dev/null%s' % datetag(epoch)
        else:
            l2 = "+++ %s%s%s" % (bprefix, fn2, datetag(bd, fn2))
        headerlines = [l1, l2]
        size = len(a)
        hunkrange = (1, size, 0, 0)
        hunklines = ["@@ -1,%d +0,0 @@\n" % size] + ["-" + e for e in a]
        if without_newline:
            hunklines[-1] += '\n'
            hunklines.append(_missing_newline_marker)
        hunks = ((hunkrange, hunklines),)
    else:
        hunks = _unidiff(a, b, opts=opts)
        # the first item yielded by _unidiff() is a bool telling whether
        # any hunk follows
        if not next(hunks):
            return sentinel

        headerlines = [
            "--- %s%s%s" % (aprefix, fn1, datetag(ad, fn1)),
            "+++ %s%s%s" % (bprefix, fn2, datetag(bd, fn2)),
        ]

    return headerlines, hunks

320

321

def _unidiff(t1, t2, opts=defaultopts):
    """Yield hunks of a headerless unified diff from t1 and t2 texts.

    Each hunk consists of a (hunkrange, hunklines) tuple where `hunkrange` is a
    tuple (s1, l1, s2, l2) representing the range information of the hunk to
    form the '@@ -s1,l1 +s2,l2 @@' header and `hunklines` is a list of lines
    of the hunk combining said header followed by line additions and
    deletions.

    The hunks are prefixed with a bool: the first item yielded is True when
    at least one hunk follows, and False (the only item) when there is none.
    """
    l1 = splitnewlines(t1)
    l2 = splitnewlines(t2)

    def contextend(l, length):
        # last line (exclusive) of trailing context, clamped to the file end
        ret = l + opts.context
        if ret > length:
            ret = length
        return ret

    def contextstart(l):
        # first line of leading context, clamped to the file start
        ret = l - opts.context
        if ret < 0:
            return 0
        return ret

    # [position to stop the backward search at, last function line found]
    lastfunc = [0, '']

    def yieldhunk(hunk):
        (astart, a2, bstart, b2, delta) = hunk
        aend = contextend(a2, len(l1))
        alen = aend - astart
        blen = b2 - bstart + aend - a2

        func = ""
        if opts.showfunc:
            lastpos, func = lastfunc
            # walk backwards from the start of the context up to the start of
            # the previous hunk context until we find a line starting with an
            # alphanumeric char.
            for i in xrange(astart - 1, lastpos - 1, -1):
                if l1[i][0:1].isalnum():
                    func = b' ' + l1[i].rstrip()
                    # split long function name if ASCII. otherwise we have no
                    # idea where the multi-byte boundary is, so just leave it.
                    if encoding.isasciistr(func):
                        func = func[:41]
                    lastfunc[1] = func
                    break
            # by recording this hunk's starting point as the next place to
            # start looking for function lines, we avoid reading any line in
            # the file more than once.
            lastfunc[0] = astart

        # zero-length hunk ranges report their start line as one less
        if alen:
            astart += 1
        if blen:
            bstart += 1

        hunkrange = astart, alen, bstart, blen
        hunklines = (
            ["@@ -%d,%d +%d,%d @@%s\n" % (hunkrange + (func,))]
            + delta
            + [' ' + l1[x] for x in xrange(a2, aend)]
        )
        # If either file ends without a newline and the last line of
        # that file is part of a hunk, a marker is printed. If the
        # last line of both files is identical and neither ends in
        # a newline, print only one marker. That's the only case in
        # which the hunk can end in a shared line without a newline.
        skip = False
        if not t1.endswith('\n') and astart + alen == len(l1) + 1:
            for i in xrange(len(hunklines) - 1, -1, -1):
                if hunklines[i].startswith(('-', ' ')):
                    if hunklines[i].startswith(' '):
                        skip = True
                    hunklines[i] += '\n'
                    hunklines.insert(i + 1, _missing_newline_marker)
                    break
        if not skip and not t2.endswith('\n') and bstart + blen == len(l2) + 1:
            for i in xrange(len(hunklines) - 1, -1, -1):
                if hunklines[i].startswith('+'):
                    hunklines[i] += '\n'
                    hunklines.insert(i + 1, _missing_newline_marker)
                    break
        yield hunkrange, hunklines

    # bdiff.blocks gives us the matching sequences in the files.  The loop
    # below finds the spaces between those matching sequences and translates
    # them into diff output.
    #
    hunk = None
    ignoredlines = 0
    has_hunks = False
    for s, stype in allblocks(t1, t2, opts, l1, l2):
        a1, a2, b1, b2 = s
        if stype != '!':
            if stype == '~':
                # The diff context lines are based on t1 content. When
                # blank lines are ignored, the new lines offsets must
                # be adjusted as if equivalent blocks ('~') had the
                # same sizes on both sides.
                ignoredlines += (b2 - b1) - (a2 - a1)
            continue
        delta = []
        # slice before b1/b2 are shifted by the ignored lines below
        old = l1[a1:a2]
        new = l2[b1:b2]

        b1 -= ignoredlines
        b2 -= ignoredlines
        astart = contextstart(a1)
        bstart = contextstart(b1)
        prev = None
        if hunk:
            # join with the previous hunk if it falls inside the context
            if astart < hunk[1] + opts.context + 1:
                prev = hunk
                astart = hunk[1]
                bstart = hunk[3]
            else:
                if not has_hunks:
                    has_hunks = True
                    yield True
                for x in yieldhunk(hunk):
                    yield x
        if prev:
            # we've joined the previous hunk, record the new ending points.
            hunk[1] = a2
            hunk[3] = b2
            delta = hunk[4]
        else:
            # create a new hunk
            hunk = [astart, a2, bstart, b2, delta]

        delta.extend([' ' + x for x in l1[astart:a1]])
        delta.extend(['-' + x for x in old])
        delta.extend(['+' + x for x in new])

    if hunk:
        if not has_hunks:
            has_hunks = True
            yield True
        for x in yieldhunk(hunk):
            yield x
    elif not has_hunks:
        yield False

466

467

def b85diff(to, tn):
    '''return a base85-encoded git binary patch replacing `to` with `tn`

    None is treated as empty content for either side. An empty string is
    returned when both sides are equal. Otherwise the result is a
    "GIT binary patch" section holding the zlib-compressed new content as
    a "literal" of len(tn) bytes, encoded in lines of at most 52 bytes.
    '''
    def fmtline(line):
        # each line starts with a character encoding its decoded length:
        # 'A'-'Z' for 1-26 bytes, 'a'-'z' for 27-52 bytes
        size = len(line)
        if size <= 26:
            prefix = pycompat.bytechr(ord('A') + size - 1)
        else:
            prefix = pycompat.bytechr(size - 26 + ord('a') - 1)
        return '%c%s\n' % (prefix, util.b85encode(line, True))

    def chunk(text, csize=52):
        # yield successive slices of at most csize bytes
        total = len(text)
        i = 0
        while i < total:
            yield text[i:i + csize]
            i += csize

    if to is None:
        to = ''
    if tn is None:
        tn = ''

    if to == tn:
        return ''

    # TODO: deltas
    ret = []
    ret.append('GIT binary patch\n')
    ret.append('literal %d\n' % len(tn))
    for piece in chunk(zlib.compress(tn)):
        ret.append(fmtline(piece))
    ret.append('\n')

    return ''.join(ret)

501

502

def patchtext(bin):
    """Return the concatenated data of every fragment in binary delta `bin`.

    `bin` is read as a sequence of fragments, each made of a 12-byte header
    (three big-endian signed 32-bit integers) followed by as many data bytes
    as the third header field says. Only the data parts are returned.
    """
    pos = 0
    t = []
    while pos < len(bin):
        # the first two header fields are not needed to extract the data
        _p1, _p2, length = struct.unpack(">lll", bin[pos:pos + 12])
        pos += 12
        t.append(bin[pos:pos + length])
        pos += length
    # fragments are bytes slices, so join them with a bytes separator
    return b"".join(t)

511

512

def patch(a, bin):
    """Apply the binary delta `bin` to text `a` and return the result.

    When `a` is empty the result is a buffer over `bin` past its first
    12 bytes; otherwise the delta is applied with mpatch.patches().
    """
    if len(a) == 0:
        # skip over trivial delta header
        return util.buffer(bin, 12)
    return mpatch.patches(a, [bin])

517

518

# similar to difflib.SequenceMatcher.get_matching_blocks

519

# similar to difflib.SequenceMatcher.get_matching_blocks

519

def get_matching_blocks(a, b):

520

def get_matching_blocks(a, b):

520

return [(d[0], d[2], d[1] - d[0]) for d in bdiff.blocks(a, b)]

521

return [(d[0], d[2], d[1] - d[0]) for d in bdiff.blocks(a, b)]

521

522

def trivialdiffheader(length):

523

def trivialdiffheader(length):

523

return struct.pack(">lll", 0, 0, length) if length else ''

524

return struct.pack(">lll", 0, 0, length) if length else ''

524

525

def replacediffheader(oldlen, newlen):

526

def replacediffheader(oldlen, newlen):

526

return struct.pack(">lll", 0, oldlen, newlen)

527

return struct.pack(">lll", 0, oldlen, newlen)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # mdiff.py - diff and patch routines for mercurial
             #
             # Copyright 2005, 2006 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import
             import re
             import struct
             import zlib
             from .i18n import _
             from . import (
                 encoding,
                 error,
                 policy,
                 pycompat,
                 util,
             )
             from .utils import dateutil
             # Marker line appended to a hunk when the last line of a text has no
             # trailing newline.
             _missing_newline_marker = "\\ No newline at end of file\n"
             # The diff/patch implementation modules are resolved by name through
             # policy.importmod().
             bdiff = policy.importmod(r'bdiff')
             mpatch = policy.importmod(r'mpatch')
             # Module-level aliases so these entry points are reachable through this
             # module.
             blocks = bdiff.blocks
             fixws = bdiff.fixws
             patches = mpatch.patches
             patchedsize = mpatch.patchedsize
             textdiff = bdiff.bdiff
             splitnewlines = bdiff.splitnewlines
             class diffopts(object):
                 '''context is the number of context lines
                 text treats all files as text
                 showfunc enables diff -p output
                 git enables the git extended patch format
                 nodates removes dates from diff headers
                 nobinary ignores binary files
                 noprefix disables the 'a/' and 'b/' prefixes (ignored in plain mode)
                 ignorews ignores all whitespace changes in the diff
                 ignorewsamount ignores changes in the amount of whitespace
                 ignorewseol ignores whitespace changes at the end of lines
                 ignoreblanklines ignores changes whose lines are all blank
                 upgrade generates git diffs to avoid data loss
                 xdiff uses bdiff.xdiffblocks for block matching when available
                 '''
                 # Every supported option with its default value. 'index',
                 # 'showsimilarity' and 'worddiff' are stored on the instance but are
                 # not read anywhere in this file.
                 defaults = {
                     'context': 3,
                     'text': False,
                     'showfunc': False,
                     'git': False,
                     'nodates': False,
                     'nobinary': False,
                     'noprefix': False,
                     'index': 0,
                     'ignorews': False,
                     'ignorewsamount': False,
                     'ignorewseol': False,
                     'ignoreblanklines': False,
                     'upgrade': False,
                     'showsimilarity': False,
                     'worddiff': False,
                     'xdiff': False,
                     }
                 def __init__(self, **opts):
                     """Set one attribute per entry of `defaults`.

                     A keyword that is missing or None falls back to its default.
                     `context` is coerced to int; error.Abort is raised when int()
                     rejects the value with ValueError.
                     """
                     opts = pycompat.byteskwargs(opts)
                     for k in self.defaults:
                         v = opts.get(k)
                         if v is None:
                             v = self.defaults[k]
                         setattr(self, k, v)
                     try:
                         self.context = int(self.context)
                     except ValueError:
                         # format through bytestr so %r renders the same way on
                         # Python 2 and Python 3
                         msg = _('diff context lines count must be '
                                 'an integer, not %r')
                         raise error.Abort(msg % pycompat.bytestr(self.context))
                 def copy(self, **kwargs):
                     """Return a new diffopts with the current values, overridden by
                     `kwargs`."""
                     opts = {k: getattr(self, k) for k in self.defaults}
                     opts = pycompat.strkwargs(opts)
                     opts.update(kwargs)
                     return diffopts(**opts)
             # Shared all-defaults instance: the default `opts` of unidiff() and
             # _unidiff(), and the fallback used by allblocks() when opts is None.
             defaultopts = diffopts()
             def wsclean(opts, text, blank=True):
                 """Return `text` normalized according to the whitespace options.

                 opts.ignorews applies bdiff.fixws(text, 1); otherwise
                 opts.ignorewsamount applies bdiff.fixws(text, 0). When `blank` is
                 true and opts.ignoreblanklines is set, runs of newlines collapse to
                 one and leading/trailing newlines are stripped. With
                 opts.ignorewseol, spaces, tabs, carriage returns and form feeds
                 directly before a newline are removed.
                 """
                 if opts.ignorews:
                     text = bdiff.fixws(text, 1)
                 elif opts.ignorewsamount:
                     text = bdiff.fixws(text, 0)
                 if blank and opts.ignoreblanklines:
                     text = re.sub('\n+', '\n', text).strip('\n')
                 if opts.ignorewseol:
                     # pattern and replacement must both be bytes: re.sub() rejects
                     # a bytes pattern combined with a native-str replacement
                     text = re.sub(br'[ \t\r\f]+\n', br'\n', text)
                 return text
             def splitblock(base1, lines1, base2, lines2, opts):
                 """Split a block that matches modulo blank lines into sub-blocks.

                 Yields ([a1, a2, b1, b2], btype) pairs whose offsets are shifted by
                 `base1`/`base2`; btype is '=' for a run of matching lines and '~'
                 for a run of blank lines.
                 """
                 # Reduce each line to a flag: 1 if something is left after
                 # wsclean(), 0 if the line is blank.
                 flags1 = [1 if wsclean(opts, line) else 0 for line in lines1]
                 flags2 = [1 if wsclean(opts, line) else 0 for line in lines2]
                 end1 = len(flags1)
                 end2 = len(flags2)
                 pos1 = pos2 = 0
                 while pos1 < end1 or pos2 < end2:
                     cur1, cur2 = pos1, pos2
                     atblank = (cur1 >= end1 or flags1[cur1] == 0
                                or cur2 >= end2 or flags2[cur2] == 0)
                     if atblank:
                         # swallow the blank lines on both sides
                         kind = '~'
                         while cur1 < end1 and flags1[cur1] == 0:
                             cur1 += 1
                         while cur2 < end2 and flags2[cur2] == 0:
                             cur2 += 1
                     else:
                         # advance in lockstep over the matching lines
                         kind = '='
                         while (cur1 < end1 and flags1[cur1] == 1
                                and flags2[cur2] == 1):
                             cur1 += 1
                             cur2 += 1
                     yield [base1 + pos1, base1 + cur1,
                            base2 + pos2, base2 + cur2], kind
                     pos1, pos2 = cur1, cur2
             def hunkinrange(hunk, linerange):
                 """Tell whether `hunk`, given as (start, length), overlaps
                 `linerange`, given as (lowerbound, upperbound).

                 >>> hunkinrange((5, 10), (2, 7))
                 True
                 >>> hunkinrange((5, 10), (6, 12))
                 True
                 >>> hunkinrange((5, 10), (13, 17))
                 True
                 >>> hunkinrange((5, 10), (3, 17))
                 True
                 >>> hunkinrange((5, 10), (1, 3))
                 False
                 >>> hunkinrange((5, 10), (18, 20))
                 False
                 >>> hunkinrange((5, 10), (1, 5))
                 False
                 >>> hunkinrange((5, 10), (15, 27))
                 False
                 """
                 hunkstart, hunklen = hunk
                 lower, upper = linerange
                 hunkend = hunkstart + hunklen
                 # the range must begin before the hunk ends ...
                 if not lower < hunkend:
                     return False
                 # ... and the hunk must begin before the range ends
                 return hunkstart < upper
             def blocksinrange(blocks, rangeb):
                 """Keep the `blocks` that touch line range `rangeb` on the "b" side
                 and map that range back to the "a" side.

                 `blocks` holds ``((a1, a2, b1, b2), stype)`` items. The result is
                 ``(filteredblocks, rangea)``:

                 * `filteredblocks` lists the items whose ``(b1, b2)`` part satisfies
                   ``rangeb[0] < b2 and b1 < rangeb[1]``;
                 * `rangea` is the corresponding line range in terms of the
                   ``(a1, a2)`` parts.

                 Raises error.Abort when either bound of `rangea` could not be
                 determined or the bounds end up inverted.
                 """
                 lbb, ubb = rangeb
                 lba = uba = None
                 filteredblocks = []
                 for block in blocks:
                     (a1, a2, b1, b2), stype = block
                     matching = stype == '='
                     if matching and b1 <= lbb and ubb <= b2:
                         # rangeb sits entirely inside one "=" block: translate both
                         # bounds by the a/b offset of that block
                         shift = a1 - b1
                         lba = lbb + shift
                         uba = ubb + shift
                     else:
                         if b1 <= lbb < b2:
                             lba = a2 - (b2 - lbb) if matching else a1
                         if b1 < ubb <= b2:
                             uba = a1 + (ubb - b1) if matching else a2
                     if hunkinrange((b1, b2 - b1), rangeb):
                         filteredblocks.append(block)
                 if lba is None or uba is None or uba < lba:
                     raise error.Abort(_('line range exceeds file size'))
                 return filteredblocks, (lba, uba)
             def chooseblocksfunc(opts=None):
                 """Return the block-matching function selected by `opts`.

                 bdiff.xdiffblocks is returned only when opts.xdiff is set and the
                 loaded bdiff module provides it; otherwise bdiff.blocks.
                 """
                 wantxdiff = opts is not None and opts.xdiff
                 if wantxdiff and util.safehasattr(bdiff, 'xdiffblocks'):
                     return bdiff.xdiffblocks
                 return bdiff.blocks
             def allblocks(text1, text2, opts=None, lines1=None, lines2=None):
                 """Yield (block, kind) pairs covering both texts.

                 `block` has the layout of an mdiff.blocks entry. `kind` is '=' for
                 blocks reported as matching by the block function, '!' for the
                 non-matching gaps between them, and '~' for gaps that compare equal
                 once blank lines are filtered out (only with opts.ignoreblanklines).

                 `lines1` and `lines2` may carry text1 and text2 already split with
                 splitnewlines(); they are computed on demand otherwise.
                 """
                 if opts is None:
                     opts = defaultopts
                 if opts.ignorews or opts.ignorewsamount or opts.ignorewseol:
                     text1 = wsclean(opts, text1, False)
                     text2 = wsclean(opts, text2, False)
                 matches = chooseblocksfunc(opts)(text1, text2)
                 # Stand-in for "the match before the first one": an empty block at
                 # the start of both texts.
                 previous = [0, 0, 0, 0]
                 for match in matches:
                     # the gap runs from the end of the previous match to the start
                     # of the current one, on both sides
                     gap = [previous[1], match[0], previous[3], match[2]]
                     previous = match
                     # An empty gap is skipped; this also eats the huge matches past
                     # eof that bdiff sometimes reports.
                     if gap[0] != gap[1] or gap[2] != gap[3]:
                         kind = '!'
                         if opts.ignoreblanklines:
                             if lines1 is None:
                                 lines1 = splitnewlines(text1)
                             if lines2 is None:
                                 lines2 = splitnewlines(text2)
                             old = wsclean(opts, "".join(lines1[gap[0]:gap[1]]))
                             new = wsclean(opts, "".join(lines2[gap[2]:gap[3]]))
                             if old == new:
                                 kind = '~'
                         yield gap, kind
                     yield match, '='
             def unidiff(a, ad, b, bd, fn1, fn2, binary, opts=defaultopts):
                 """Build a unified diff and return it as a (headers, hunks) tuple.

                 For a non-empty diff, `headers` is the list of the two header lines
                 "--- <original>" and "+++ <new>" (empty for binary content) and
                 `hunks` is an iterable of (hunkrange, hunklines) items; for regular
                 text changes it is the generator coming from _unidiff().

                 When there is nothing to report, both `headers` and `hunks` are
                 empty.

                 Pass binary=True if either a or b should be taken as a binary file.
                 """
                 def datetag(date, fn=None):
                     if not (opts.git or opts.nodates):
                         return '\t%s' % date
                     return '\t' if fn and ' ' in fn else ''
                 nothing = [], ()
                 if not (a or b):
                     return nothing
                 aprefix, bprefix = ('', '') if opts.noprefix else ('a/', 'b/')
                 epoch = dateutil.datestr((0, 0))
                 fn1 = util.pconvert(fn1)
                 fn2 = util.pconvert(fn2)
                 if binary:
                     if a and b and len(a) == len(b) and a == b:
                         return nothing
                     return [], ((None, ['Binary file %s has changed\n' % fn1]),)
                 if not a:
                     # everything in b is an addition
                     nonewline = not b.endswith('\n')
                     added = splitnewlines(b)
                     if a is None:
                         oldheader = '--- /dev/null%s' % datetag(epoch)
                     else:
                         oldheader = "--- %s%s%s" % (aprefix, fn1, datetag(ad, fn1))
                     newheader = "+++ %s%s" % (bprefix + fn2, datetag(bd, fn2))
                     count = len(added)
                     body = ["@@ -0,0 +1,%d @@\n" % count]
                     body.extend("+" + e for e in added)
                     if nonewline:
                         body[-1] += '\n'
                         body.append(_missing_newline_marker)
                     return [oldheader, newheader], (((0, 0, 1, count), body),)
                 if not b:
                     # everything in a is a removal
                     nonewline = not a.endswith('\n')
                     removed = splitnewlines(a)
                     oldheader = "--- %s%s%s" % (aprefix, fn1, datetag(ad, fn1))
                     if b is None:
                         newheader = '+++ /dev/null%s' % datetag(epoch)
                     else:
                         newheader = "+++ %s%s%s" % (bprefix, fn2, datetag(bd, fn2))
                     count = len(removed)
                     body = ["@@ -1,%d +0,0 @@\n" % count]
                     body.extend("-" + e for e in removed)
                     if nonewline:
                         body[-1] += '\n'
                         body.append(_missing_newline_marker)
                     return [oldheader, newheader], (((1, count, 0, 0), body),)
                 hunks = _unidiff(a, b, opts=opts)
                 # the first item from _unidiff() is a bool telling whether any hunk
                 # follows
                 if not next(hunks):
                     return nothing
                 headerlines = [
                     "--- %s%s%s" % (aprefix, fn1, datetag(ad, fn1)),
                     "+++ %s%s%s" % (bprefix, fn2, datetag(bd, fn2)),
                 ]
                 return headerlines, hunks
             def _unidiff(t1, t2, opts=defaultopts):
                 """Yield hunks of a headerless unified diff from t1 and t2 texts.
                 Each hunk consists of a (hunkrange, hunklines) tuple where `hunkrange` is a
                 tuple (s1, l1, s2, l2) representing the range information of the hunk to
                 form the '@@ -s1,l1 +s2,l2 @@' header and `hunklines` is a list of lines
                 of the hunk combining said header followed by line additions and
                 deletions.
                 The hunks are prefixed with a bool: the first item yielded is True
                 when at least one hunk follows and False when there is none.
                 """
                 l1 = splitnewlines(t1)
                 l2 = splitnewlines(t2)
                 # last line index of the trailing context, clamped to `len`
                 def contextend(l, len):
                     ret = l + opts.context
                     if ret > len:
                         ret = len
                     return ret
                 # first line index of the leading context, clamped to 0
                 def contextstart(l):
                     ret = l - opts.context
                     if ret < 0:
                         return 0
                     return ret
                 # [index at which the backwards search for a function line stops,
                 #  last function text found]; shared across yieldhunk() calls
                 lastfunc = [0, '']
                 # Turn a pending hunk [astart, a2, bstart, b2, delta] into a
                 # (hunkrange, hunklines) item, adding the trailing context lines and
                 # the missing-newline markers.
                 def yieldhunk(hunk):
                     (astart, a2, bstart, b2, delta) = hunk
                     aend = contextend(a2, len(l1))
                     alen = aend - astart
                     blen = b2 - bstart + aend - a2
                     func = ""
                     if opts.showfunc:
                         lastpos, func = lastfunc
                         # walk backwards from the start of the context up to the start of
                         # the previous hunk context until we find a line starting with an
                         # alphanumeric char.
                         for i in xrange(astart - 1, lastpos - 1, -1):
                             if l1[i][0:1].isalnum():
                                 func = b' ' + l1[i].rstrip()
                                 # split long function name if ASCII. otherwise we have no
                                 # idea where the multi-byte boundary is, so just leave it.
                                 if encoding.isasciistr(func):
                                     func = func[:41]
                                 lastfunc[1] = func
                                 break
                         # by recording this hunk's starting point as the next place to
                         # start looking for function lines, we avoid reading any line in
                         # the file more than once.
                         lastfunc[0] = astart
                     # zero-length hunk ranges report their start line as one less
                     if alen:
                         astart += 1
                     if blen:
                         bstart += 1
                     hunkrange = astart, alen, bstart, blen
                     hunklines = (
                         ["@@ -%d,%d +%d,%d @@%s\n" % (hunkrange + (func,))]
                         + delta
                         + [' ' + l1[x] for x in xrange(a2, aend)]
                     )
                     # If either file ends without a newline and the last line of
                     # that file is part of a hunk, a marker is printed. If the
                     # last line of both files is identical and neither ends in
                     # a newline, print only one marker. That's the only case in
                     # which the hunk can end in a shared line without a newline.
                     skip = False
                     if not t1.endswith('\n') and astart + alen == len(l1) + 1:
                         # find the last line that belongs to t1 (removed or context)
                         for i in xrange(len(hunklines) - 1, -1, -1):
                             if hunklines[i].startswith(('-', ' ')):
                                 if hunklines[i].startswith(' '):
                                     skip = True
                                 hunklines[i] += '\n'
                                 hunklines.insert(i + 1, _missing_newline_marker)
                                 break
                     if not skip and not t2.endswith('\n') and bstart + blen == len(l2) + 1:
                         # find the last added line
                         for i in xrange(len(hunklines) - 1, -1, -1):
                             if hunklines[i].startswith('+'):
                                 hunklines[i] += '\n'
                                 hunklines.insert(i + 1, _missing_newline_marker)
                                 break
                     yield hunkrange, hunklines
                 # bdiff.blocks gives us the matching sequences in the files.  The loop
                 # below finds the spaces between those matching sequences and translates
                 # them into diff output.
                 #
                 # pending hunk as [astart, a2, bstart, b2, delta], or None
                 hunk = None
                 ignoredlines = 0
                 # whether the leading bool has already been yielded
                 has_hunks = False
                 for s, stype in allblocks(t1, t2, opts, l1, l2):
                     a1, a2, b1, b2 = s
                     if stype != '!':
                         if stype == '~':
                             # The diff context lines are based on t1 content. When
                             # blank lines are ignored, the new lines offsets must
                             # be adjusted as if equivalent blocks ('~') had the
                             # same sizes on both sides.
                             ignoredlines += (b2 - b1) - (a2 - a1)
                         continue
                     delta = []
                     old = l1[a1:a2]
                     new = l2[b1:b2]
                     b1 -= ignoredlines
                     b2 -= ignoredlines
                     astart = contextstart(a1)
                     bstart = contextstart(b1)
                     prev = None
                     if hunk:
                         # join with the previous hunk if it falls inside the context
                         if astart < hunk[1] + opts.context + 1:
                             prev = hunk
                             astart = hunk[1]
                             bstart = hunk[3]
                         else:
                             # the pending hunk is complete: emit it, preceded by the
                             # leading True if this is the first hunk
                             if not has_hunks:
                                 has_hunks = True
                                 yield True
                             for x in yieldhunk(hunk):
                                 yield x
                     if prev:
                         # we've joined the previous hunk, record the new ending points.
                         hunk[1] = a2
                         hunk[3] = b2
                         delta = hunk[4]
                     else:
                         # create a new hunk
                         hunk = [astart, a2, bstart, b2, delta]
                     # leading context (or the lines between two joined changes),
                     # then the removed lines, then the added lines
                     delta[len(delta):] = [' ' + x for x in l1[astart:a1]]
                     delta[len(delta):] = ['-' + x for x in old]
                     delta[len(delta):] = ['+' + x for x in new]
                 # flush the last pending hunk, or report that there was none
                 if hunk:
                     if not has_hunks:
                         has_hunks = True
                         yield True
                     for x in yieldhunk(hunk):
                         yield x
                 elif not has_hunks:
                     yield False
             def b85diff(to, tn):
                 '''Return a "GIT binary patch" section carrying the new content.

                 `to` and `tn` are the old and new contents; None counts as empty.
                 An empty string is returned when both are equal. Otherwise the
                 result is a "literal" patch: `tn` is zlib-compressed, cut into
                 pieces of at most 52 bytes, and each piece is written as one line
                 made of a length character followed by the base85 encoding.
                 '''
                 def fmtline(line):
                     # lengths 1..26 map to 'A'..'Z', larger ones continue from 'a'
                     size = len(line)
                     if size <= 26:
                         code = ord('A') + size - 1
                     else:
                         code = size - 26 + ord('a') - 1
                     prefix = pycompat.bytechr(code)
                     return '%c%s\n' % (prefix, util.b85encode(line, True))
                 def chunk(text, csize=52):
                     total = len(text)
                     start = 0
                     while start < total:
                         stop = start + csize
                         yield text[start:stop]
                         start = stop
                 to = '' if to is None else to
                 tn = '' if tn is None else tn
                 if to == tn:
                     return ''
                 # TODO: deltas
                 ret = ['GIT binary patch\n', 'literal %d\n' % len(tn)]
                 ret.extend(fmtline(piece) for piece in chunk(zlib.compress(tn)))
                 ret.append('\n')
                 return ''.join(ret)
             def patchtext(bin):
                 """Return the concatenated data of every fragment in delta `bin`.

                 Each fragment starts with a 12-byte header of three big-endian
                 signed 32-bit integers; the third one is the length of the data
                 that follows the header.
                 """
                 headersize = 12
                 pieces = []
                 offset = 0
                 while offset < len(bin):
                     datastart = offset + headersize
                     header = struct.unpack(">lll", bin[offset:datastart])
                     datalen = header[2]
                     pieces.append(bin[datastart:datastart + datalen])
                     offset = datastart + datalen
                 return "".join(pieces)
             def patch(a, bin):
                 """Apply delta `bin` to text `a` and return the result.

                 For an empty `a` no patching is done: the result is a buffer over
                 `bin` starting after its 12-byte trivial delta header.
                 """
                 if len(a) != 0:
                     return mpatch.patches(a, [bin])
                 # skip over trivial delta header
                 return util.buffer(bin, 12)
             # similar to difflib.SequenceMatcher.get_matching_blocks
             def get_matching_blocks(a, b):
                 """Return bdiff.blocks(a, b) as a list of (d[0], d[2], d[1] - d[0])
                 triples, i.e. (start in a, start in b, size)."""
                 triples = []
                 for blk in bdiff.blocks(a, b):
                     triples.append((blk[0], blk[2], blk[1] - blk[0]))
                 return triples
             def trivialdiffheader(length):
                 """Return the 12-byte header (0, 0, length) packed as three
                 big-endian signed 32-bit integers, or an empty string when `length`
                 is falsy."""
                 if not length:
                     return ''
                 return struct.pack(">lll", 0, 0, length)
             def replacediffheader(oldlen, newlen):
                 """Return the 12-byte header (0, oldlen, newlen) packed as three
                 big-endian signed 32-bit integers."""
                 # NOTE(review): presumably start offset, end offset and new data
                 # length of a fragment replacing the whole old text - confirm
                 # against the mpatch format.
                 fields = (0, oldlen, newlen)
                 return struct.pack(">lll", *fields)