##// END OF EJS Templates
patch: avoid repeated binary checks if all files in a patch are text...
Joerg Sonnenberger -
r35868:079b27b5 default
parent child Browse files
Show More
@@ -1,492 +1,495 b''
1 # mdiff.py - diff and patch routines for mercurial
1 # mdiff.py - diff and patch routines for mercurial
2 #
2 #
3 # Copyright 2005, 2006 Matt Mackall <mpm@selenic.com>
3 # Copyright 2005, 2006 Matt Mackall <mpm@selenic.com>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 from __future__ import absolute_import
8 from __future__ import absolute_import
9
9
10 import re
10 import re
11 import struct
11 import struct
12 import zlib
12 import zlib
13
13
14 from .i18n import _
14 from .i18n import _
15 from . import (
15 from . import (
16 error,
16 error,
17 policy,
17 policy,
18 pycompat,
18 pycompat,
19 util,
19 util,
20 )
20 )
21
21
# Both helper modules are loaded through policy.importmod rather than a
# plain import statement.
bdiff = policy.importmod(r'bdiff')
mpatch = policy.importmod(r'mpatch')

# Module-level aliases for the helpers used most often.
blocks = bdiff.blocks
fixws = bdiff.fixws
patches = mpatch.patches
patchedsize = mpatch.patchedsize
textdiff = bdiff.bdiff
30
30
def splitnewlines(text):
    '''like str.splitlines, but only split on newlines.

    Every returned line keeps its trailing '\\n'; only the last line may
    lack one (when `text` does not end with a newline).  Other line
    separators such as '\\r' are left untouched.  An empty `text` yields an
    empty list.
    '''
    lines = [l + '\n' for l in text.split('\n')]
    if lines:
        if lines[-1] == '\n':
            # text ended with a newline: split() produced a trailing empty
            # element which is not a real line
            lines.pop()
        else:
            # the last line had no newline; remove the one added above
            lines[-1] = lines[-1][:-1]
    return lines
40
40
class diffopts(object):
    '''context is the number of context lines
    text treats all files as text
    showfunc enables diff -p output
    git enables the git extended patch format
    nodates removes dates from diff headers
    nobinary ignores binary files
    noprefix disables the 'a/' and 'b/' prefixes (ignored in plain mode)
    ignorews ignores all whitespace changes in the diff
    ignorewsamount ignores changes in the amount of whitespace
    ignorewseol ignores whitespace changes at the end of lines
    ignoreblanklines ignores changes whose lines are all blank
    upgrade generates git diffs to avoid data loss
    '''

    # Every supported option with its default value.  Each key becomes an
    # instance attribute in __init__.
    defaults = {
        'context': 3,
        'text': False,
        'showfunc': False,
        'git': False,
        'nodates': False,
        'nobinary': False,
        'noprefix': False,
        'index': 0,
        'ignorews': False,
        'ignorewsamount': False,
        'ignorewseol': False,
        'ignoreblanklines': False,
        'upgrade': False,
        'showsimilarity': False,
        'worddiff': False,
    }

    def __init__(self, **opts):
        """Set one attribute per known option.

        Options that are missing from `opts`, or passed as None, take their
        value from `defaults`.  Keyword arguments that are not listed in
        `defaults` are ignored.

        Raises error.Abort if `context` cannot be converted to an integer.
        """
        opts = pycompat.byteskwargs(opts)
        for k in self.defaults:
            v = opts.get(k)
            if v is None:
                v = self.defaults[k]
            setattr(self, k, v)

        try:
            self.context = int(self.context)
        except ValueError:
            raise error.Abort(_('diff context lines count must be '
                                'an integer, not %r') % self.context)

    def copy(self, **kwargs):
        """Return a new diffopts with the same values, overridden by
        `kwargs`."""
        opts = dict((k, getattr(self, k)) for k in self.defaults)
        opts = pycompat.strkwargs(opts)
        opts.update(kwargs)
        return diffopts(**opts)
92
92
# Shared instance holding the default value of every option; used as the
# default `opts` argument by the diff functions of this module.
defaultopts = diffopts()
94
94
def wsclean(opts, text, blank=True):
    """Return `text` normalized according to the whitespace options.

    * opts.ignorews / opts.ignorewsamount: `text` is passed through
      bdiff.fixws() with mode 1 / 0 respectively (ignorews wins when both
      are set).
    * opts.ignoreblanklines (only when `blank` is true): runs of newlines
      are collapsed to one and leading/trailing newlines are stripped.
    * opts.ignorewseol: spaces, tabs, carriage returns and form feeds
      directly before a newline are removed.
    """
    if opts.ignorews:
        text = bdiff.fixws(text, 1)
    elif opts.ignorewsamount:
        text = bdiff.fixws(text, 0)
    if blank and opts.ignoreblanklines:
        text = re.sub('\n+', '\n', text).strip('\n')
    if opts.ignorewseol:
        # pattern and replacement must have the same type: with a bytes
        # pattern a native-str replacement raises TypeError on Python 3
        text = re.sub(br'[ \t\r\f]+\n', br'\n', text)
    return text
105
105
def splitblock(base1, lines1, base2, lines2, opts):
    """Split a block into matching ('=') and blank-only ('~') sub-blocks.

    Yields ``[a1, a2, b1, b2], btype`` items whose line numbers are offset
    by `base1` (first side) and `base2` (second side).
    """
    # The input lines matches except for interwoven blank lines. We
    # transform it into a sequence of matching blocks and blank blocks.
    # A line maps to 1 when something is left after wsclean(), 0 otherwise.
    lines1 = [(1 if wsclean(opts, l) else 0) for l in lines1]
    lines2 = [(1 if wsclean(opts, l) else 0) for l in lines2]
    s1, e1 = 0, len(lines1)
    s2, e2 = 0, len(lines2)
    while s1 < e1 or s2 < e2:
        i1, i2, btype = s1, s2, '='
        if (i1 >= e1 or lines1[i1] == 0
            or i2 >= e2 or lines2[i2] == 0):
            # Consume the block of blank lines
            btype = '~'
            while i1 < e1 and lines1[i1] == 0:
                i1 += 1
            while i2 < e2 and lines2[i2] == 0:
                i2 += 1
        else:
            # Consume the matching lines
            while i1 < e1 and lines1[i1] == 1 and lines2[i2] == 1:
                i1 += 1
                i2 += 1
        yield [base1 + s1, base1 + i1, base2 + s2, base2 + i2], btype
        s1 = i1
        s2 = i2
131
131
def hunkinrange(hunk, linerange):
    """Return True if `hunk` defined as (start, length) is in `linerange`
    defined as (lowerbound, upperbound).

    >>> hunkinrange((5, 10), (2, 7))
    True
    >>> hunkinrange((5, 10), (6, 12))
    True
    >>> hunkinrange((5, 10), (13, 17))
    True
    >>> hunkinrange((5, 10), (3, 17))
    True
    >>> hunkinrange((5, 10), (1, 3))
    False
    >>> hunkinrange((5, 10), (18, 20))
    False
    >>> hunkinrange((5, 10), (1, 5))
    False
    >>> hunkinrange((5, 10), (15, 27))
    False
    """
    start, length = hunk
    lowerbound, upperbound = linerange
    # half-open interval overlap: [start, start + length) against
    # [lowerbound, upperbound)
    return lowerbound < start + length and start < upperbound
156
156
def blocksinrange(blocks, rangeb):
    """filter `blocks` like (a1, a2, b1, b2) from items outside line range
    `rangeb` from ``(b1, b2)`` point of view.

    Return `filteredblocks, rangea` where:

    * `filteredblocks` is list of ``block = (a1, a2, b1, b2), stype`` items of
      `blocks` that are inside `rangeb` from ``(b1, b2)`` point of view; a
      block ``(b1, b2)`` being inside `rangeb` if
      ``rangeb[0] < b2 and b1 < rangeb[1]``;
    * `rangea` is the line range w.r.t. to ``(a1, a2)`` parts of `blocks`.

    Raise error.Abort when no bound could be computed for `rangea`, or when
    the computed upper bound is below the lower bound.
    """
    lbb, ubb = rangeb
    lba, uba = None, None
    filteredblocks = []
    for block in blocks:
        (a1, a2, b1, b2), stype = block
        if lbb >= b1 and ubb <= b2 and stype == '=':
            # rangeb is within a single "=" hunk, restrict back linerange1
            # by offsetting rangeb
            lba = lbb - b1 + a1
            uba = ubb - b1 + a1
        else:
            if b1 <= lbb < b2:
                # the lower bound falls inside this block
                if stype == '=':
                    lba = a2 - (b2 - lbb)
                else:
                    lba = a1
            if b1 < ubb <= b2:
                # the upper bound falls inside this block
                if stype == '=':
                    uba = a1 + (ubb - b1)
                else:
                    uba = a2
        if hunkinrange((b1, (b2 - b1)), rangeb):
            filteredblocks.append(block)
    if lba is None or uba is None or uba < lba:
        raise error.Abort(_('line range exceeds file size'))
    return filteredblocks, (lba, uba)
195
195
def allblocks(text1, text2, opts=None, lines1=None, lines2=None):
    """Return (block, type) tuples, where block is an mdiff.blocks
    line entry. type is '=' for blocks matching exactly one another
    (bdiff blocks), '!' for non-matching blocks and '~' for blocks
    matching only after having filtered blank lines.
    lines1 and lines2 are text1 and text2 split with splitnewlines() if
    they are already available.
    """
    if opts is None:
        opts = defaultopts
    if opts.ignorews or opts.ignorewsamount or opts.ignorewseol:
        text1 = wsclean(opts, text1, False)
        text2 = wsclean(opts, text2, False)
    diff = bdiff.blocks(text1, text2)
    for i, s1 in enumerate(diff):
        # The first match is special.
        # we've either found a match starting at line 0 or a match later
        # in the file.  If it starts later, old and new below will both be
        # empty and we'll continue to the next match.
        if i > 0:
            s = diff[i - 1]
        else:
            s = [0, 0, 0, 0]
        # the gap between the end of the previous match and the start of
        # the current one
        s = [s[1], s1[0], s[3], s1[2]]

        # bdiff sometimes gives huge matches past eof, this check eats them,
        # and deals with the special first match case described above
        if s[0] != s[1] or s[2] != s[3]:
            btype = '!'
            if opts.ignoreblanklines:
                if lines1 is None:
                    lines1 = splitnewlines(text1)
                if lines2 is None:
                    lines2 = splitnewlines(text2)
                old = wsclean(opts, "".join(lines1[s[0]:s[1]]))
                new = wsclean(opts, "".join(lines2[s[2]:s[3]]))
                if old == new:
                    btype = '~'
            yield s, btype
        yield s1, '='
236
236
def unidiff(a, ad, b, bd, fn1, fn2, opts=defaultopts, check_binary=True):
    """Return a unified diff as a (headers, hunks) tuple.

    If the diff is not null, `headers` is a list with unified diff header
    lines "--- <original>" and "+++ <new>" and `hunks` is a generator yielding
    (hunkrange, hunklines) coming from _unidiff().
    Otherwise, `headers` and `hunks` are empty.

    Setting `check_binary` to false will skip the binary check, i.e. when
    it has been done in advance. Files are expected to be text in this case.
    """
    def datetag(date, fn=None):
        if not opts.git and not opts.nodates:
            return '\t%s' % date
        if fn and ' ' in fn:
            return '\t'
        return ''

    sentinel = [], ()
    if not a and not b:
        return sentinel

    if opts.noprefix:
        aprefix = bprefix = ''
    else:
        aprefix = 'a/'
        bprefix = 'b/'

    epoch = util.datestr((0, 0))

    fn1 = util.pconvert(fn1)
    fn2 = util.pconvert(fn2)

    def checknonewline(lines):
        for text in lines:
            if text[-1:] != '\n':
                # the marker line starts with a literal backslash
                text += "\n\\ No newline at end of file\n"
            yield text

    if not opts.text and check_binary and (util.binary(a) or util.binary(b)):
        if a and b and len(a) == len(b) and a == b:
            return sentinel
        headerlines = []
        # note the trailing comma: `hunks` is a 1-tuple holding one hunk
        hunks = (None, ['Binary file %s has changed\n' % fn1]),
    elif not a:
        # everything in b is an addition
        b = splitnewlines(b)
        if a is None:
            l1 = '--- /dev/null%s' % datetag(epoch)
        else:
            l1 = "--- %s%s%s" % (aprefix, fn1, datetag(ad, fn1))
        l2 = "+++ %s%s" % (bprefix + fn2, datetag(bd, fn2))
        headerlines = [l1, l2]
        size = len(b)
        hunkrange = (0, 0, 1, size)
        hunklines = ["@@ -0,0 +1,%d @@\n" % size] + ["+" + e for e in b]
        hunks = (hunkrange, checknonewline(hunklines)),
    elif not b:
        # everything in a is a removal
        a = splitnewlines(a)
        l1 = "--- %s%s%s" % (aprefix, fn1, datetag(ad, fn1))
        if b is None:
            l2 = '+++ /dev/null%s' % datetag(epoch)
        else:
            l2 = "+++ %s%s%s" % (bprefix, fn2, datetag(bd, fn2))
        headerlines = [l1, l2]
        size = len(a)
        hunkrange = (1, size, 0, 0)
        hunklines = ["@@ -1,%d +0,0 @@\n" % size] + ["-" + e for e in a]
        hunks = (hunkrange, checknonewline(hunklines)),
    else:
        diffhunks = _unidiff(a, b, opts=opts)
        # fetch the first hunk eagerly to find out whether there is any
        # difference at all
        try:
            hunkrange, hunklines = next(diffhunks)
        except StopIteration:
            return sentinel

        headerlines = [
            "--- %s%s%s" % (aprefix, fn1, datetag(ad, fn1)),
            "+++ %s%s%s" % (bprefix, fn2, datetag(bd, fn2)),
        ]
        def rewindhunks():
            # put back the hunk consumed above, then stream the rest
            yield hunkrange, checknonewline(hunklines)
            for hr, hl in diffhunks:
                yield hr, checknonewline(hl)

        hunks = rewindhunks()

    return headerlines, hunks
321
324
def _unidiff(t1, t2, opts=defaultopts):
    """Yield hunks of a headerless unified diff from t1 and t2 texts.

    Each hunk consists of a (hunkrange, hunklines) tuple where `hunkrange` is a
    tuple (s1, l1, s2, l2) representing the range information of the hunk to
    form the '@@ -s1,l1 +s2,l2 @@' header and `hunklines` is a list of lines
    of the hunk combining said header followed by line additions and
    deletions.
    """
    l1 = splitnewlines(t1)
    l2 = splitnewlines(t2)
    def contextend(l, total):
        # end of the trailing context, clamped to the number of lines
        ret = l + opts.context
        if ret > total:
            ret = total
        return ret

    def contextstart(l):
        # start of the leading context, clamped to the first line
        ret = l - opts.context
        if ret < 0:
            return 0
        return ret

    # [position where the last search started, last function line found]
    lastfunc = [0, '']
    def yieldhunk(hunk):
        (astart, a2, bstart, b2, delta) = hunk
        aend = contextend(a2, len(l1))
        alen = aend - astart
        blen = b2 - bstart + aend - a2

        func = ""
        if opts.showfunc:
            lastpos, func = lastfunc
            # walk backwards from the start of the context up to the start of
            # the previous hunk context until we find a line starting with an
            # alphanumeric char.
            for i in xrange(astart - 1, lastpos - 1, -1):
                if l1[i][0:1].isalnum():
                    func = ' ' + l1[i].rstrip()[:40]
                    lastfunc[1] = func
                    break
            # by recording this hunk's starting point as the next place to
            # start looking for function lines, we avoid reading any line in
            # the file more than once.
            lastfunc[0] = astart

        # zero-length hunk ranges report their start line as one less
        if alen:
            astart += 1
        if blen:
            bstart += 1

        hunkrange = astart, alen, bstart, blen
        hunklines = (
            ["@@ -%d,%d +%d,%d @@%s\n" % (hunkrange + (func,))]
            + delta
            + [' ' + l1[x] for x in xrange(a2, aend)]
        )
        yield hunkrange, hunklines

    # bdiff.blocks gives us the matching sequences in the files.  The loop
    # below finds the spaces between those matching sequences and translates
    # them into diff output.
    #
    hunk = None
    ignoredlines = 0
    for s, stype in allblocks(t1, t2, opts, l1, l2):
        a1, a2, b1, b2 = s
        if stype != '!':
            if stype == '~':
                # The diff context lines are based on t1 content. When
                # blank lines are ignored, the new lines offsets must
                # be adjusted as if equivalent blocks ('~') had the
                # same sizes on both sides.
                ignoredlines += (b2 - b1) - (a2 - a1)
            continue
        delta = []
        old = l1[a1:a2]
        new = l2[b1:b2]

        b1 -= ignoredlines
        b2 -= ignoredlines
        astart = contextstart(a1)
        bstart = contextstart(b1)
        prev = None
        if hunk:
            # join with the previous hunk if it falls inside the context
            if astart < hunk[1] + opts.context + 1:
                prev = hunk
                astart = hunk[1]
                bstart = hunk[3]
            else:
                for x in yieldhunk(hunk):
                    yield x
        if prev:
            # we've joined the previous hunk, record the new ending points.
            hunk[1] = a2
            hunk[3] = b2
            delta = hunk[4]
        else:
            # create a new hunk
            hunk = [astart, a2, bstart, b2, delta]

        # `delta` is the list stored in the hunk: extend it in place
        delta.extend([' ' + x for x in l1[astart:a1]])
        delta.extend(['-' + x for x in old])
        delta.extend(['+' + x for x in new])

    if hunk:
        for x in yieldhunk(hunk):
            yield x
432
435
def b85diff(to, tn):
    '''return a base85-encoded git binary patch replacing `to` with `tn`

    None is treated like empty content.  An empty string is returned when
    both contents are equal.  The patch always carries the full new content
    as a "literal" (no deltas).
    '''
    def fmtline(line):
        # each output line starts with one character encoding the length of
        # the raw chunk: 'A'..'Z' for 1..26, 'a'..'z' for 27..52
        l = len(line)
        if l <= 26:
            l = chr(ord('A') + l - 1)
        else:
            l = chr(l - 26 + ord('a') - 1)
        return '%c%s\n' % (l, util.b85encode(line, True))

    def chunk(text, csize=52):
        # yield successive pieces of at most `csize` items of `text`
        l = len(text)
        i = 0
        while i < l:
            yield text[i:i + csize]
            i += csize

    if to is None:
        to = ''
    if tn is None:
        tn = ''

    if to == tn:
        return ''

    # TODO: deltas
    ret = []
    ret.append('GIT binary patch\n')
    ret.append('literal %d\n' % len(tn))
    for l in chunk(zlib.compress(tn)):
        ret.append(fmtline(l))
    ret.append('\n')

    return ''.join(ret)
467
470
def patchtext(bin):
    """Return the concatenated data of every fragment of binary delta `bin`.

    `bin` is read as a sequence of fragments, each made of a 12-byte header
    (three big-endian signed 32-bit integers, the last one being the length
    of the data) followed by the data itself.  The first two header fields
    are not used here.
    """
    pos = 0
    t = []
    while pos < len(bin):
        p1, p2, l = struct.unpack(">lll", bin[pos:pos + 12])
        pos += 12
        t.append(bin[pos:pos + l])
        pos += l
    # fragments are byte strings: join with a bytes separator so this also
    # works on Python 3 (b"" is a plain str on Python 2)
    return b"".join(t)
477
480
def patch(a, bin):
    """Apply binary delta `bin` to text `a` and return the result.

    When `a` is empty, the result is taken from `bin` itself, starting
    after its first 12 bytes.
    """
    if len(a) == 0:
        # skip over trivial delta header
        return util.buffer(bin, 12)
    return mpatch.patches(a, [bin])
483
486
# similar to difflib.SequenceMatcher.get_matching_blocks
def get_matching_blocks(a, b):
    """Return the blocks of bdiff.blocks(a, b) as (a1, b1, length) tuples.

    Each bdiff block is indexed as (a1, a2, b1, b2); the length is taken
    from the `a` side (a2 - a1).
    """
    return [(d[0], d[2], d[1] - d[0]) for d in bdiff.blocks(a, b)]
487
490
def trivialdiffheader(length):
    """Return the 12-byte delta header (0, 0, length), or an empty byte
    string when `length` is zero.

    The header is three big-endian signed 32-bit integers.
    """
    # b'' keeps the return type identical to struct.pack() on Python 3
    return struct.pack(">lll", 0, 0, length) if length else b''
490
493
def replacediffheader(oldlen, newlen):
    """Return the 12-byte delta header (0, oldlen, newlen).

    The header is three big-endian signed 32-bit integers.
    """
    return struct.pack(">lll", 0, oldlen, newlen)
@@ -1,2901 +1,2907 b''
1 # patch.py - patch file parsing routines
1 # patch.py - patch file parsing routines
2 #
2 #
3 # Copyright 2006 Brendan Cully <brendan@kublai.com>
3 # Copyright 2006 Brendan Cully <brendan@kublai.com>
4 # Copyright 2007 Chris Mason <chris.mason@oracle.com>
4 # Copyright 2007 Chris Mason <chris.mason@oracle.com>
5 #
5 #
6 # This software may be used and distributed according to the terms of the
6 # This software may be used and distributed according to the terms of the
7 # GNU General Public License version 2 or any later version.
7 # GNU General Public License version 2 or any later version.
8
8
9 from __future__ import absolute_import, print_function
9 from __future__ import absolute_import, print_function
10
10
11 import collections
11 import collections
12 import copy
12 import copy
13 import difflib
13 import difflib
14 import email
14 import email
15 import email.parser as emailparser
15 import email.parser as emailparser
16 import errno
16 import errno
17 import hashlib
17 import hashlib
18 import os
18 import os
19 import posixpath
19 import posixpath
20 import re
20 import re
21 import shutil
21 import shutil
22 import tempfile
22 import tempfile
23 import zlib
23 import zlib
24
24
25 from .i18n import _
25 from .i18n import _
26 from .node import (
26 from .node import (
27 hex,
27 hex,
28 short,
28 short,
29 )
29 )
30 from . import (
30 from . import (
31 copies,
31 copies,
32 encoding,
32 encoding,
33 error,
33 error,
34 mail,
34 mail,
35 mdiff,
35 mdiff,
36 pathutil,
36 pathutil,
37 policy,
37 policy,
38 pycompat,
38 pycompat,
39 scmutil,
39 scmutil,
40 similar,
40 similar,
41 util,
41 util,
42 vfs as vfsmod,
42 vfs as vfsmod,
43 )
43 )
44
44
# implementation module looked up through the policy machinery
diffhelpers = policy.importmod(r'diffhelpers')
stringio = util.stringio

# "diff --git a/<src> b/<dst>" header; group 1 is src, group 2 is dst
gitre = re.compile(br'diff --git a/(.*) b/(.*)')
# splits a line into alternating runs of tabs and non-tabs
tabsplitter = re.compile(br'(\t+|[^\t]+)')
# a single byte that is not an ASCII word character or a high (0x80-0xff) byte
_nonwordre = re.compile(br'([^a-zA-Z0-9_\x80-\xff])')

# re-exported under this module's name
PatchError = error.PatchError
53
53
54 # public functions
54 # public functions
55
55
def split(stream):
    '''return an iterator of individual patches from a stream

    The leading lines of the stream are inspected to choose a splitting
    strategy: "# HG changeset patch" markers, mbox "From " separators, a
    MIME message (a content-type header was seen), or a header block
    followed by a "--- " line. If none of these is recognized the whole
    stream is returned as one patch. Every item produced is a stringio
    positioned at its start.
    '''
    def isheader(line, inheader):
        lead = line[0]
        if inheader and lead in (' ', '\t'):
            # continuation
            return True
        if lead in (' ', '-', '+'):
            # diff line - don't check for header pattern in there
            return False
        fields = line.split(': ', 1)
        return len(fields) == 2 and ' ' not in fields[0]

    def chunk(lines):
        return stringio(''.join(lines))

    def hgsplit(stream, cur):
        # cur already holds the first "# HG changeset patch" line
        inheader = True

        for line in stream:
            if not line.strip():
                # a blank line ends the header of the current patch
                inheader = False
            if not inheader and line.startswith('# HG changeset patch'):
                yield chunk(cur)
                cur = []
                inheader = True

            cur.append(line)

        if cur:
            yield chunk(cur)

    def mboxsplit(stream, cur):
        def flush(lines):
            # drop the "From " separator line and split what follows
            return split(chunk(lines[1:]))

        for line in stream:
            if line.startswith('From '):
                for c in flush(cur):
                    yield c
                cur = []

            cur.append(line)

        if cur:
            for c in flush(cur):
                yield c

    def mimesplit(stream, cur):
        def msgfp(m):
            fp = stringio()
            gen = email.Generator.Generator(fp, mangle_from_=False)
            gen.flatten(m)
            fp.seek(0)
            return fp

        # the email parser needs the complete message
        cur.extend(stream)
        m = emailparser.Parser().parse(chunk(cur))
        if not m.is_multipart():
            yield msgfp(m)
            return

        ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
        for part in m.walk():
            if part.get_content_type() in ok_types:
                yield msgfp(part)

    def headersplit(stream, cur):
        inheader = False

        for line in stream:
            if not inheader and isheader(line, inheader):
                # a new header block starts a new patch
                yield chunk(cur)
                cur = []
                inheader = True
            if inheader and not isheader(line, inheader):
                inheader = False

            cur.append(line)

        if cur:
            yield chunk(cur)

    def remainder(cur):
        yield chunk(cur)

    class fiter(object):
        # adapts an object that only has readline() to the iterator protocol
        def __init__(self, fp):
            self.fp = fp

        def __iter__(self):
            return self

        def next(self):
            line = self.fp.readline()
            if line:
                return line
            raise StopIteration

        __next__ = next

    inheader = False
    cur = []

    mimeheaders = ['content-type']

    if not util.safehasattr(stream, 'next'):
        # http responses, for example, have readline but not next
        stream = fiter(stream)

    for line in stream:
        cur.append(line)
        if line.startswith('# HG changeset patch'):
            return hgsplit(stream, cur)
        elif line.startswith('From '):
            return mboxsplit(stream, cur)
        elif isheader(line, inheader):
            inheader = True
            name = line.split(':', 1)[0]
            if name.lower() in mimeheaders:
                # let email parser handle this
                return mimesplit(stream, cur)
        elif line.startswith('--- ') and inheader:
            # No evil headers seen by diff start, split by hand
            return headersplit(stream, cur)
        # Not enough info, keep reading

    # if we are here, we have a very plain patch
    return remainder(cur)
184
184
## Some facility for extensible patch parsing:
# list of pairs ("header to match", "data key")
patchheadermap = [
    ('Date', 'date'),
    ('Branch', 'branch'),
    ('Node ID', 'nodeid'),
]
191
191
def extract(ui, fileobj):
    '''extract patch from data read from fileobj.

    patch can be a normal patch or contained in an email message.

    return a dictionary. Keys this function may set are:
      - filename,
      - message,
      - user,
      - p1,
      - p2,
    plus one key per patchheadermap entry (date, branch, nodeid).
    'user' and 'message' are always set; 'user' may be empty. If filename
    is missing, fileobj did not contain a patch. Caller must unlink
    filename when done.'''

    # attempt to detect the start of a patch
    # (this heuristic is borrowed from quilt)
    diffre = re.compile(br'^(?:Index:[ \t]|diff[ \t]-|RCS file: |'
                        br'retrieving revision [0-9]+(\.[0-9]+)*$|'
                        br'---[ \t].*?^\+\+\+[ \t]|'
                        br'\*\*\*[ \t].*?^---[ \t])',
                        re.MULTILINE | re.DOTALL)

    data = {}
    fd, tmpname = tempfile.mkstemp(prefix='hg-patch-')
    tmpfp = os.fdopen(fd, pycompat.sysstr('w'))
    try:
        msg = emailparser.Parser().parse(fileobj)

        subject = msg['Subject'] and mail.headdecode(msg['Subject'])
        data['user'] = msg['From'] and mail.headdecode(msg['From'])
        if not (subject or data['user']):
            # Not an email, restore parsed headers if any
            subject = '\n'.join(': '.join(h) for h in msg.items()) + '\n'

        # should try to parse msg['Date']
        parents = []

        if subject:
            if subject.startswith('[PATCH'):
                closing = subject.find(']')
                if closing >= 0:
                    subject = subject[closing + 1:].lstrip()
            # unfold continuation lines
            subject = re.sub(br'\n[ \t]+', ' ', subject)
            ui.debug('Subject: %s\n' % subject)
        if data['user']:
            ui.debug('From: %s\n' % data['user'])
        diffs_seen = 0
        ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
        message = ''
        for part in msg.walk():
            content_type = part.get_content_type()
            ui.debug('Content-Type: %s\n' % content_type)
            if content_type not in ok_types:
                continue
            payload = part.get_payload(decode=True)
            found = diffre.search(payload)
            if not found:
                # plain text after a message but before any diff extends
                # the message
                if (not diffs_seen and message
                    and content_type == 'text/plain'):
                    message += '\n' + payload
                continue

            hgpatch = False
            hgpatchheader = False
            ignoretext = False

            diffstart = found.start(0)
            ui.debug('found patch at byte %d\n' % diffstart)
            diffs_seen += 1
            msgbuf = stringio()
            # everything before the diff is header and/or commit message
            for line in payload[:diffstart].splitlines():
                if line.startswith('# HG changeset patch') and not hgpatch:
                    ui.debug('patch generated by hg export\n')
                    hgpatch = True
                    hgpatchheader = True
                    # drop earlier commit message content
                    msgbuf.seek(0)
                    msgbuf.truncate()
                    subject = None
                elif hgpatchheader:
                    if line.startswith('# User '):
                        data['user'] = line[7:]
                        ui.debug('From: %s\n' % data['user'])
                    elif line.startswith("# Parent "):
                        parents.append(line[9:].lstrip())
                    elif line.startswith("# "):
                        for header, key in patchheadermap:
                            prefix = '# %s ' % header
                            if line.startswith(prefix):
                                data[key] = line[len(prefix):]
                    else:
                        # first non-"# " line ends the hg export header
                        hgpatchheader = False
                elif line == '---':
                    ignoretext = True
                if not (hgpatchheader or ignoretext):
                    msgbuf.write(line)
                    msgbuf.write('\n')
            message = msgbuf.getvalue()
            if tmpfp:
                tmpfp.write(payload)
                if not payload.endswith('\n'):
                    tmpfp.write('\n')
    except: # re-raises
        tmpfp.close()
        os.unlink(tmpname)
        raise

    if subject and not message.startswith(subject):
        message = '%s\n%s' % (subject, message)
    data['message'] = message
    tmpfp.close()
    if parents:
        data['p1'] = parents.pop(0)
        if parents:
            data['p2'] = parents.pop(0)

    if not diffs_seen:
        os.unlink(tmpname)
    else:
        data['filename'] = tmpname
    return data
312
312
class patchmeta(object):
    """Metadata describing how one file is affected by a patch.

    'op' is one of ADD, DELETE, RENAME, MODIFY or COPY and starts out as
    MODIFY. 'path' is the patched file path. 'oldpath' starts as None
    and holds the origin file for COPY and RENAME. 'mode' is None until
    setmode() is called, after which it is an (islink, isexec) pair of
    masked mode bits (non-zero meaning set). 'binary' starts as False.
    """
    def __init__(self, path):
        self.path = path
        self.oldpath = None
        self.mode = None
        self.op = 'MODIFY'
        self.binary = False

    def setmode(self, mode):
        # keep only the symlink bit and the owner-executable bit
        self.mode = (mode & 0o20000, mode & 0o100)

    def copy(self):
        clone = patchmeta(self.path)
        for attr in ('oldpath', 'mode', 'op', 'binary'):
            setattr(clone, attr, getattr(self, attr))
        return clone

    def _ispatchinga(self, afile):
        if afile != '/dev/null':
            return afile == 'a/' + (self.oldpath or self.path)
        # a missing source only makes sense for an added file
        return self.op == 'ADD'

    def _ispatchingb(self, bfile):
        if bfile != '/dev/null':
            return bfile == 'b/' + self.path
        # a missing destination only makes sense for a deleted file
        return self.op == 'DELETE'

    def ispatching(self, afile, bfile):
        if not self._ispatchinga(afile):
            return False
        return self._ispatchingb(bfile)

    def __repr__(self):
        return "<patchmeta %s %r>" % (self.op, self.path)
358
358
def readgitpatch(lr):
    """Collect git-style metadata from the patch lines yielded by lr.

    Returns a list of patchmeta objects, one per "diff --git" header
    matched by gitre, in the order they were found.
    """
    gitpatches = []
    gp = None
    for rawline in lr:
        line = rawline.rstrip(' \r\n')
        if line.startswith('diff --git a/'):
            m = gitre.match(line)
            if m:
                if gp:
                    gitpatches.append(gp)
                gp = patchmeta(m.group(2))
            continue
        if not gp:
            # not inside a git header, nothing to record
            continue
        if line.startswith('--- '):
            # the extended header ends where the hunks begin
            gitpatches.append(gp)
            gp = None
        elif line.startswith('rename from '):
            gp.op = 'RENAME'
            gp.oldpath = line[len('rename from '):]
        elif line.startswith('rename to '):
            gp.path = line[len('rename to '):]
        elif line.startswith('copy from '):
            gp.op = 'COPY'
            gp.oldpath = line[len('copy from '):]
        elif line.startswith('copy to '):
            gp.path = line[len('copy to '):]
        elif line.startswith('deleted file'):
            gp.op = 'DELETE'
        elif line.startswith('new file mode '):
            gp.op = 'ADD'
            # the mode is the trailing six octal digits
            gp.setmode(int(line[-6:], 8))
        elif line.startswith('new mode '):
            gp.setmode(int(line[-6:], 8))
        elif line.startswith('GIT binary patch'):
            gp.binary = True
    if gp:
        gitpatches.append(gp)

    return gitpatches
402
402
class linereader(object):
    # thin wrapper over a file object that lets callers push lines back;
    # pushed lines are returned, oldest first, before fp is read again
    def __init__(self, fp):
        self.fp = fp
        self.buf = []

    def push(self, line):
        # None is silently ignored
        if line is None:
            return
        self.buf.append(line)

    def readline(self):
        if not self.buf:
            return self.fp.readline()
        return self.buf.pop(0)

    def __iter__(self):
        # iteration stops at the first empty string returned by readline()
        return iter(self.readline, '')
422
422
class abstractbackend(object):
    """Interface of the objects patched files are read from and written to.

    Apart from storing ui, every method except writerej() raises
    NotImplementedError and is meant to be overridden.
    """
    def __init__(self, ui):
        self.ui = ui

    def getfile(self, fname):
        """Return target file data and flags as a (data, (islink,
        isexec)) tuple. Data is None if file is missing/deleted.
        """
        raise NotImplementedError

    def setfile(self, fname, data, mode, copysource):
        """Write data to target file fname and set its mode. mode is a
        (islink, isexec) tuple. If data is None, the file content should
        be left unchanged. If the file is modified after being copied,
        copysource is set to the original file name.
        """
        raise NotImplementedError

    def unlink(self, fname):
        """Unlink target file."""
        raise NotImplementedError

    def writerej(self, fname, failed, total, lines):
        """Write rejected lines for fname. failed is the number of hunks
        which failed to apply and total the total number of hunks for
        this file.

        The default implementation does nothing, so backends that do not
        override it silently drop the rejects.
        """

    def exists(self, fname):
        """Tell whether target file fname exists."""
        raise NotImplementedError

    def close(self):
        """Finish using the backend."""
        raise NotImplementedError
456
456
class fsbackend(abstractbackend):
    """Backend that reads and writes files through a vfs rooted at basedir."""
    def __init__(self, ui, basedir):
        super(fsbackend, self).__init__(ui)
        self.opener = vfsmod.vfs(basedir)

    def getfile(self, fname):
        """Return (data, (islink, isexec)) for fname.

        For a symlink, data is the link target. (None, None) is returned
        when reading the file fails with ENOENT.
        """
        if self.opener.islink(fname):
            return (self.opener.readlink(fname), (True, False))

        isexec = False
        try:
            isexec = self.opener.lstat(fname).st_mode & 0o100 != 0
        except OSError as e:
            # a missing file is handled by the read below
            if e.errno != errno.ENOENT:
                raise
        try:
            return (self.opener.read(fname), (False, isexec))
        except IOError as e:
            if e.errno != errno.ENOENT:
                raise
        return None, None

    def setfile(self, fname, data, mode, copysource):
        """Write data to fname and apply mode, an (islink, isexec) pair.

        With data set to None only the flags are updated. copysource is
        not used by this backend.
        """
        islink, isexec = mode
        if data is None:
            self.opener.setflags(fname, islink, isexec)
            return
        if islink:
            self.opener.symlink(data, fname)
        else:
            self.opener.write(fname, data)
            if isexec:
                self.opener.setflags(fname, False, True)

    def unlink(self, fname):
        """Remove fname; a missing file is not an error."""
        self.opener.unlinkpath(fname, ignoremissing=True)

    def writerej(self, fname, failed, total, lines):
        """Warn about failed hunks and save lines to fname + ".rej"."""
        fname = fname + ".rej"
        self.ui.warn(
            _("%d out of %d hunks FAILED -- saving rejects to file %s\n") %
            (failed, total, fname))
        fp = self.opener(fname, 'w')
        try:
            fp.writelines(lines)
        finally:
            # do not leak the handle if writing the rejects fails
            fp.close()

    def exists(self, fname):
        """Tell whether fname exists, without following symlinks."""
        return self.opener.lexists(fname)
505
505
class workingbackend(fsbackend):
    """fsbackend rooted at repo.root that also records what it touched.

    Changed, removed and copied files are remembered as they are patched
    and reported to the repository in close().
    """
    def __init__(self, ui, repo, similarity):
        super(workingbackend, self).__init__(ui, repo.root)
        self.repo = repo
        self.similarity = similarity
        self.removed = set()
        self.changed = set()
        self.copied = []

    def _checkknown(self, fname):
        # refuse to touch a file that exists on disk but has state '?'
        untracked = self.repo.dirstate[fname] == '?'
        if untracked and self.exists(fname):
            raise PatchError(_('cannot patch %s: file is not tracked') % fname)

    def setfile(self, fname, data, mode, copysource):
        self._checkknown(fname)
        super(workingbackend, self).setfile(fname, data, mode, copysource)
        if copysource is not None:
            self.copied.append((copysource, fname))
        self.changed.add(fname)

    def unlink(self, fname):
        self._checkknown(fname)
        super(workingbackend, self).unlink(fname)
        self.removed.add(fname)
        self.changed.add(fname)

    def close(self):
        wctx = self.repo[None]
        touched = set(self.changed)
        for src, dst in self.copied:
            scmutil.dirstatecopy(self.ui, self.repo, wctx, src, dst)
        if self.removed:
            wctx.forget(sorted(self.removed))
            # File was deleted and no longer belongs to the
            # dirstate, it was probably marked added then
            # deleted, and should not be considered by
            # marktouched().
            touched.difference_update(
                f for f in self.removed if f not in self.repo.dirstate)
        if touched:
            scmutil.marktouched(self.repo, touched, self.similarity)
        return sorted(self.changed)
549
549
class filestore(object):
    """Store of (data, mode, copied) entries keyed by file name.

    Entries are kept in memory while their cumulative size stays within
    maxsize (4 MiB when maxsize is None; a negative maxsize disables the
    limit). Anything beyond that is written into a temporary directory
    which close() removes.
    """
    def __init__(self, maxsize=None):
        self.opener = None
        self.files = {}
        self.created = 0
        self.maxsize = 4*(2**20) if maxsize is None else maxsize
        self.size = 0
        self.data = {}

    def setfile(self, fname, data, mode, copied=None):
        length = len(data)
        if self.maxsize < 0 or (length + self.size) <= self.maxsize:
            self.data[fname] = (data, mode, copied)
            self.size += length
            return

        # over budget: spill to disk, creating the directory on first use
        if self.opener is None:
            root = tempfile.mkdtemp(prefix='hg-patch-')
            self.opener = vfsmod.vfs(root)
        # Avoid filename issues with these simple names
        fn = str(self.created)
        self.opener.write(fn, data)
        self.created += 1
        self.files[fname] = (fn, mode, copied)

    def getfile(self, fname):
        if fname in self.data:
            return self.data[fname]
        if self.opener and fname in self.files:
            fn, mode, copied = self.files[fname]
            return self.opener.read(fn), mode, copied
        return None, None, None

    def close(self):
        if not self.opener:
            return
        shutil.rmtree(self.opener.base)
586
586
class repobackend(abstractbackend):
    """Backend reading files from ctx and writing results into store.

    Names of written files are collected in 'changed', names of unlinked
    files in 'removed', and 'copied' maps a written file to its copy
    source.
    """
    def __init__(self, ui, repo, ctx, store):
        super(repobackend, self).__init__(ui)
        self.repo = repo
        self.ctx = ctx
        self.store = store
        self.changed = set()
        self.removed = set()
        self.copied = {}

    def _checkknown(self, fname):
        if fname in self.ctx:
            return
        raise PatchError(_('cannot patch %s: file is not tracked') % fname)

    def getfile(self, fname):
        try:
            fctx = self.ctx[fname]
        except error.LookupError:
            return None, None
        flags = fctx.flags()
        islink = 'l' in flags
        isexec = 'x' in flags
        return fctx.data(), (islink, isexec)

    def setfile(self, fname, data, mode, copysource):
        if copysource:
            self._checkknown(copysource)
        if data is None:
            # content unchanged: reuse what ctx already has
            data = self.ctx[fname].data()
        self.store.setfile(fname, data, mode, copysource)
        self.changed.add(fname)
        if copysource:
            self.copied[fname] = copysource

    def unlink(self, fname):
        self._checkknown(fname)
        self.removed.add(fname)

    def exists(self, fname):
        return fname in self.ctx

    def close(self):
        return self.changed | self.removed
628
628
# Hunk range descriptors.  Raw strings are used so that the regex escapes
# (\d, \+, \*) reach the re module verbatim instead of relying on Python
# passing unknown string escapes through unchanged.

# @@ -start,len +start,len @@ or @@ -start +start @@ if len is 1
unidesc = re.compile(r'@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@')
# "*** start,len ***" or "--- start,len ---"; ",len" is optional
contextdesc = re.compile(r'(?:---|\*\*\*) (\d+)(?:,(\d+))? (?:---|\*\*\*)')
# recognized end-of-line handling modes (see patchfile's eolmode argument)
eolmodes = ['strict', 'crlf', 'lf', 'auto']
633
633
class patchfile(object):
    """Apply the hunks of a patch to the lines of a single file.

    The target's lines are loaded at construction time from ``backend``
    (or from ``store`` when the patch names a copy/rename source).
    apply() edits ``self.lines`` in place, and close() writes the result
    and any rejected hunks back through ``backend``.
    """

    def __init__(self, ui, gp, backend, store, eolmode='strict'):
        """Load the file described by ``gp`` and prepare it for patching.

        ``gp`` supplies ``path``, ``oldpath``, ``mode`` and ``op``.
        ``eolmode`` selects how line endings are treated: anything other
        than 'strict' makes the loaded lines use '\\n' internally, and
        writelines() decides what is written back.
        """
        self.fname = gp.path
        self.eolmode = eolmode
        # EOL of the first loaded line, None if there is nothing to go by
        self.eol = None
        self.backend = backend
        self.ui = ui
        self.lines = []
        self.exists = False
        self.missing = True
        self.mode = gp.mode
        self.copysource = gp.oldpath
        self.create = gp.op in ('ADD', 'COPY', 'RENAME')
        self.remove = gp.op == 'DELETE'
        if self.copysource is None:
            data, mode = backend.getfile(self.fname)
        else:
            data, mode = store.getfile(self.copysource)[:2]
        if data is not None:
            self.exists = self.copysource is None or backend.exists(self.fname)
            self.missing = False
            if data:
                self.lines = mdiff.splitnewlines(data)
            if self.mode is None:
                self.mode = mode
            if self.lines:
                # Normalize line endings
                if self.lines[0].endswith('\r\n'):
                    self.eol = '\r\n'
                elif self.lines[0].endswith('\n'):
                    self.eol = '\n'
                if eolmode != 'strict':
                    self.lines = [l[:-2] + '\n' if l.endswith('\r\n') else l
                                  for l in self.lines]
        else:
            if self.create:
                self.missing = False
            if self.mode is None:
                self.mode = (False, False)
        if self.missing:
            self.ui.warn(_("unable to find '%s' for patching\n") % self.fname)
            self.ui.warn(_("(use '--prefix' to apply patch relative to the "
                           "current directory)\n"))

        # line content -> list of indexes in self.lines, rebuilt by apply()
        self.hash = {}
        self.dirty = False
        # accumulated change in line count from the hunks applied so far
        self.offset = 0
        # distance between where the last fuzzy hunk was expected and found
        self.skew = 0
        self.rej = []
        self.fileprinted = False
        self.printfile(False)
        self.hunks = 0

    def writelines(self, fname, lines, mode):
        """Hand ``lines`` to the backend, converting '\\n' as eolmode asks.

        In 'crlf' mode, or in 'auto' mode when the original file used
        another EOL, a trailing '\\n' on each line is replaced by that EOL.
        'strict' and 'lf' write the lines unchanged.
        """
        if self.eolmode == 'auto':
            eol = self.eol
        elif self.eolmode == 'crlf':
            eol = '\r\n'
        else:
            eol = '\n'

        if self.eolmode != 'strict' and eol and eol != '\n':
            lines = [l[:-1] + eol if l and l[-1] == '\n' else l
                     for l in lines]

        self.backend.setfile(fname, ''.join(lines), mode, self.copysource)

    def printfile(self, warn):
        """Announce the file being patched, as a warning or a note.

        Once the name has been shown as a warning, or while the ui is
        verbose, later calls are no-ops.
        """
        if self.fileprinted:
            return
        if warn or self.ui.verbose:
            self.fileprinted = True
        s = _("patching file %s\n") % self.fname
        if warn:
            self.ui.warn(s)
        else:
            self.ui.note(s)

    def findlines(self, l, linenum):
        """Return the indexes where line ``l`` occurs, nearest first."""
        # looks through the hash and finds candidate lines.  The
        # result is a list of line numbers sorted based on distance
        # from linenum

        cand = self.hash.get(l, [])
        if len(cand) > 1:
            # resort our list of potentials forward then back.
            cand.sort(key=lambda x: abs(x - linenum))
        return cand

    def write_rej(self):
        """Pass the rejected hunks, if any, to ``backend.writerej()``."""
        # our rejects are a little different from patch(1).  This always
        # creates rejects in the same form as the original patch.  A file
        # header is inserted so that you can run the reject through patch again
        # without having to type the filename.
        if not self.rej:
            return
        base = os.path.basename(self.fname)
        lines = ["--- %s\n+++ %s\n" % (base, base)]
        for x in self.rej:
            for l in x.hunk:
                lines.append(l)
                if l[-1:] != '\n':
                    # backslash written explicitly; "\ " is not a valid
                    # string escape
                    lines.append("\n\\ No newline at end of file\n")
        self.backend.writerej(self.fname, len(self.rej), self.hunks, lines)

    def apply(self, h):
        """Apply hunk ``h`` to the in-memory lines.

        Returns 0 when the hunk applied exactly where expected, the fuzz
        length used when it was placed by the offset/fuzz search, and -1
        when it was rejected (the hunk is then appended to ``self.rej``).
        Raises PatchError if the hunk is incomplete.
        """
        if not h.complete():
            raise PatchError(_("bad hunk #%d %s (%d %d %d %d)") %
                             (h.number, h.desc, len(h.a), h.lena, len(h.b),
                              h.lenb))

        self.hunks += 1

        if self.missing:
            self.rej.append(h)
            return -1

        if self.exists and self.create:
            if self.copysource:
                self.ui.warn(_("cannot create %s: destination already "
                               "exists\n") % self.fname)
            else:
                self.ui.warn(_("file %s already exists\n") % self.fname)
            self.rej.append(h)
            return -1

        if isinstance(h, binhunk):
            if self.remove:
                self.backend.unlink(self.fname)
            else:
                l = h.new(self.lines)
                self.lines[:] = l
                self.offset += len(l)
                self.dirty = True
            return 0

        # keep the untouched hunk so that a reject shows the original text
        horig = h
        if (self.eolmode in ('crlf', 'lf')
            or self.eolmode == 'auto' and self.eol):
            # If new eols are going to be normalized, then normalize
            # hunk data before patching. Otherwise, preserve input
            # line-endings.
            h = h.getnormalized()

        # fast case first, no offsets, no fuzz
        old, oldstart, new, newstart = h.fuzzit(0, False)
        oldstart += self.offset
        orig_start = oldstart
        # if there's skew we want to emit the "(offset %d lines)" even
        # when the hunk cleanly applies at start + skew, so skip the
        # fast case code
        if (self.skew == 0 and
            diffhelpers.testhunk(old, self.lines, oldstart) == 0):
            if self.remove:
                self.backend.unlink(self.fname)
            else:
                self.lines[oldstart:oldstart + len(old)] = new
                self.offset += len(new) - len(old)
                self.dirty = True
            return 0

        # ok, we couldn't match the hunk.  Lets look for offsets and fuzz it
        self.hash = {}
        for x, s in enumerate(self.lines):
            self.hash.setdefault(s, []).append(x)

        for fuzzlen in xrange(self.ui.configint("patch", "fuzz") + 1):
            for toponly in [True, False]:
                old, oldstart, new, newstart = h.fuzzit(fuzzlen, toponly)
                oldstart = oldstart + self.offset + self.skew
                oldstart = min(oldstart, len(self.lines))
                if old:
                    cand = self.findlines(old[0][1:], oldstart)
                else:
                    # Only adding lines with no or fuzzed context, just
                    # take the skew in account
                    cand = [oldstart]

                for l in cand:
                    if (not old or
                        diffhelpers.testhunk(old, self.lines, l) == 0):
                        self.lines[l : l + len(old)] = new
                        self.offset += len(new) - len(old)
                        self.skew = l - orig_start
                        self.dirty = True
                        offset = l - orig_start - fuzzlen
                        if fuzzlen:
                            msg = _("Hunk #%d succeeded at %d "
                                    "with fuzz %d "
                                    "(offset %d lines).\n")
                            self.printfile(True)
                            self.ui.warn(msg %
                                         (h.number, l + 1, fuzzlen, offset))
                        else:
                            msg = _("Hunk #%d succeeded at %d "
                                    "(offset %d lines).\n")
                            self.ui.note(msg % (h.number, l + 1, offset))
                        return fuzzlen
        self.printfile(True)
        self.ui.warn(_("Hunk #%d FAILED at %d\n") % (h.number, orig_start))
        self.rej.append(horig)
        return -1

    def close(self):
        """Write back modified lines and rejects; return the reject count."""
        if self.dirty:
            self.writelines(self.fname, self.lines, self.mode)
        self.write_rej()
        return len(self.rej)
850
850
class header(object):
    """patch header

    Wraps the list of header lines that precede a file's hunks and
    answers questions about them (file names, new/binary/special file).
    """
    diffgit_re = re.compile('diff --git a/(.*) b/(.*)$')
    diff_re = re.compile('diff -r .* (.*)$')
    allhunks_re = re.compile('(?:index|deleted file) ')
    pretty_re = re.compile('(?:new file|deleted file) ')
    special_re = re.compile('(?:index|deleted|copy|rename) ')
    newfile_re = re.compile('(?:new file)')

    def __init__(self, header):
        self.header = header
        self.hunks = []

    def binary(self):
        """Tell whether any header line starts with 'index '."""
        for line in self.header:
            if line.startswith('index '):
                return True
        return False

    def pretty(self, fp):
        """Write a condensed, human-oriented form of the header to ``fp``.

        Lines are echoed until an 'index ', 'new file'/'deleted file' or
        '---' line is reached; that line is summarized and output stops.
        """
        for line in self.header:
            if line.startswith('index '):
                fp.write(_('this modifies a binary file (all or nothing)\n'))
                break
            elif self.pretty_re.match(line):
                fp.write(line)
                if self.binary():
                    fp.write(_('this is a binary file\n'))
                break
            elif line.startswith('---'):
                changed = sum(max(hk.added, hk.removed) for hk in self.hunks)
                fp.write(_('%d hunks, %d lines changed\n') %
                         (len(self.hunks), changed))
                break
            fp.write(line)

    def write(self, fp):
        """Write the header lines to ``fp`` unchanged."""
        fp.write(''.join(self.header))

    def allhunks(self):
        """Tell whether a header line starts with 'index ' or 'deleted file '."""
        for line in self.header:
            if self.allhunks_re.match(line):
                return True
        return False

    def files(self):
        """Return the file name(s) found on the first header line.

        For a 'diff --git' line this is a list holding one name when both
        sides agree and two otherwise.  For a 'diff -r' line it is the
        tuple of groups matched by ``diff_re``.
        """
        firstline = self.header[0]
        gitmatch = self.diffgit_re.match(firstline)
        if not gitmatch:
            return self.diff_re.match(firstline).groups()
        fromfile, tofile = gitmatch.groups()
        if fromfile != tofile:
            return [fromfile, tofile]
        return [fromfile]

    def filename(self):
        """Return the last name reported by files()."""
        return self.files()[-1]

    def __repr__(self):
        names = ' '.join(map(repr, self.files()))
        return '<header %s>' % names

    def isnewfile(self):
        """Tell whether any header line starts with 'new file'."""
        for line in self.header:
            if self.newfile_re.match(line):
                return True
        return False

    def special(self):
        """Tell whether the file is handled at the header level only."""
        # Special files are shown only at the header level and not at the hunk
        # level for example a file that has been deleted is a special file.
        # The user cannot change the content of the operation, in the case of
        # the deleted file he has to take the deletion or not take it, he
        # cannot take some of it.
        # Newly added files are special if they are empty, they are not special
        # if they have some content as we want to be able to change it
        if self.isnewfile() and len(self.header) == 2:
            return True
        for line in self.header:
            if self.special_re.match(line):
                return True
        return False
922
922
class recordhunk(object):
    """patch hunk

    XXX shouldn't we merge this with the other hunk class?
    """

    def __init__(self, header, fromline, toline, proc, before, hunk, after,
                 maxcontext=None):
        """Store one hunk, optionally trimming its surrounding context.

        ``before`` and ``after`` are the context lines around the changed
        lines in ``hunk``.  When ``maxcontext`` is given, at most that
        many context lines are kept on each side and the start lines are
        moved forward by the number of leading lines dropped.
        """
        def trimcontext(lines, reverse=False):
            # returns (number of lines dropped, remaining lines); with
            # reverse=True the tail of ``lines`` is kept, else the head
            if maxcontext is None:
                return 0, lines
            excess = len(lines) - maxcontext
            if excess <= 0:
                return 0, lines
            if reverse:
                return excess, lines[excess:]
            return excess, lines[:maxcontext]

        self.header = header
        trimedbefore, self.before = trimcontext(before, True)
        self.fromline = fromline + trimedbefore
        self.toline = toline + trimedbefore
        _trimedafter, self.after = trimcontext(after, False)
        self.proc = proc
        self.hunk = hunk
        self.added, self.removed = self.countchanges(self.hunk)

    def __eq__(self, v):
        if not isinstance(v, recordhunk):
            return False
        if v.hunk != self.hunk:
            return False
        if v.proc != self.proc:
            return False
        if self.fromline != v.fromline:
            return False
        return self.header.files() == v.header.files()

    def __hash__(self):
        key = (tuple(self.hunk),
               tuple(self.header.files()),
               self.fromline,
               self.proc)
        return hash(key)

    def countchanges(self, hunk):
        """hunk -> (n+,n-)"""
        added = sum(1 for line in hunk if line.startswith('+'))
        removed = sum(1 for line in hunk if line.startswith('-'))
        return added, removed

    def reversehunk(self):
        """return another recordhunk which is the reverse of the hunk

        If this hunk is diff(A, B), the returned hunk is diff(B, A). To do
        that, swap fromline/toline and +/- signs while keep other things
        unchanged.
        """
        flipped = {'+': '-', '-': '+', '\\': '\\'}
        reversedlines = []
        for line in self.hunk:
            reversedlines.append('%s%s' % (flipped[line[0:1]], line[1:]))
        return recordhunk(self.header, self.toline, self.fromline, self.proc,
                          self.before, reversedlines, self.after)

    def write(self, fp):
        """Write the '@@' range line followed by the hunk's lines to ``fp``."""
        contextlen = len(self.before) + len(self.after)
        # the "no newline" marker is not a line of the file itself
        if self.after and self.after[-1] == '\\ No newline at end of file\n':
            contextlen -= 1
        fromlen = contextlen + self.removed
        tolen = contextlen + self.added
        suffix = self.proc and (' ' + self.proc)
        fp.write('@@ -%d,%d +%d,%d @@%s\n' %
                 (self.fromline, fromlen, self.toline, tolen, suffix))
        fp.write(''.join(self.before + self.hunk + self.after))

    pretty = write

    def filename(self):
        """Return the file name reported by the hunk's header."""
        return self.header.filename()

    def __repr__(self):
        return '<hunk %r@%d>' % (self.filename(), self.fromline)
1001
1001
def getmessages():
    """Return the translated prompt strings used by filterpatch().

    The result maps 'multiple', 'single' and 'help' to dictionaries keyed
    by operation name ('apply', 'discard' or 'record').
    """
    multiple = {
        'apply': _("apply change %d/%d to '%s'?"),
        'discard': _("discard change %d/%d to '%s'?"),
        'record': _("record change %d/%d to '%s'?"),
    }
    single = {
        'apply': _("apply this change to '%s'?"),
        'discard': _("discard this change to '%s'?"),
        'record': _("record this change to '%s'?"),
    }
    # choice strings: the accepted keys, then one '$$'-separated entry per
    # answer
    helptext = {
        'apply': _('[Ynesfdaq?]'
                   '$$ &Yes, apply this change'
                   '$$ &No, skip this change'
                   '$$ &Edit this change manually'
                   '$$ &Skip remaining changes to this file'
                   '$$ Apply remaining changes to this &file'
                   '$$ &Done, skip remaining changes and files'
                   '$$ Apply &all changes to all remaining files'
                   '$$ &Quit, applying no changes'
                   '$$ &? (display help)'),
        'discard': _('[Ynesfdaq?]'
                     '$$ &Yes, discard this change'
                     '$$ &No, skip this change'
                     '$$ &Edit this change manually'
                     '$$ &Skip remaining changes to this file'
                     '$$ Discard remaining changes to this &file'
                     '$$ &Done, skip remaining changes and files'
                     '$$ Discard &all changes to all remaining files'
                     '$$ &Quit, discarding no changes'
                     '$$ &? (display help)'),
        'record': _('[Ynesfdaq?]'
                    '$$ &Yes, record this change'
                    '$$ &No, skip this change'
                    '$$ &Edit this change manually'
                    '$$ &Skip remaining changes to this file'
                    '$$ Record remaining changes to this &file'
                    '$$ &Done, skip remaining changes and files'
                    '$$ Record &all changes to all remaining files'
                    '$$ &Quit, recording no changes'
                    '$$ &? (display help)'),
    }
    return {
        'multiple': multiple,
        'single': single,
        'help': helptext,
    }
1047
1047
1048 def filterpatch(ui, headers, operation=None):
1048 def filterpatch(ui, headers, operation=None):
1049 """Interactively filter patch chunks into applied-only chunks"""
1049 """Interactively filter patch chunks into applied-only chunks"""
1050 messages = getmessages()
1050 messages = getmessages()
1051
1051
1052 if operation is None:
1052 if operation is None:
1053 operation = 'record'
1053 operation = 'record'
1054
1054
1055 def prompt(skipfile, skipall, query, chunk):
1055 def prompt(skipfile, skipall, query, chunk):
1056 """prompt query, and process base inputs
1056 """prompt query, and process base inputs
1057
1057
1058 - y/n for the rest of file
1058 - y/n for the rest of file
1059 - y/n for the rest
1059 - y/n for the rest
1060 - ? (help)
1060 - ? (help)
1061 - q (quit)
1061 - q (quit)
1062
1062
1063 Return True/False and possibly updated skipfile and skipall.
1063 Return True/False and possibly updated skipfile and skipall.
1064 """
1064 """
1065 newpatches = None
1065 newpatches = None
1066 if skipall is not None:
1066 if skipall is not None:
1067 return skipall, skipfile, skipall, newpatches
1067 return skipall, skipfile, skipall, newpatches
1068 if skipfile is not None:
1068 if skipfile is not None:
1069 return skipfile, skipfile, skipall, newpatches
1069 return skipfile, skipfile, skipall, newpatches
1070 while True:
1070 while True:
1071 resps = messages['help'][operation]
1071 resps = messages['help'][operation]
1072 r = ui.promptchoice("%s %s" % (query, resps))
1072 r = ui.promptchoice("%s %s" % (query, resps))
1073 ui.write("\n")
1073 ui.write("\n")
1074 if r == 8: # ?
1074 if r == 8: # ?
1075 for c, t in ui.extractchoices(resps)[1]:
1075 for c, t in ui.extractchoices(resps)[1]:
1076 ui.write('%s - %s\n' % (c, encoding.lower(t)))
1076 ui.write('%s - %s\n' % (c, encoding.lower(t)))
1077 continue
1077 continue
1078 elif r == 0: # yes
1078 elif r == 0: # yes
1079 ret = True
1079 ret = True
1080 elif r == 1: # no
1080 elif r == 1: # no
1081 ret = False
1081 ret = False
1082 elif r == 2: # Edit patch
1082 elif r == 2: # Edit patch
1083 if chunk is None:
1083 if chunk is None:
1084 ui.write(_('cannot edit patch for whole file'))
1084 ui.write(_('cannot edit patch for whole file'))
1085 ui.write("\n")
1085 ui.write("\n")
1086 continue
1086 continue
1087 if chunk.header.binary():
1087 if chunk.header.binary():
1088 ui.write(_('cannot edit patch for binary file'))
1088 ui.write(_('cannot edit patch for binary file'))
1089 ui.write("\n")
1089 ui.write("\n")
1090 continue
1090 continue
1091 # Patch comment based on the Git one (based on comment at end of
1091 # Patch comment based on the Git one (based on comment at end of
1092 # https://mercurial-scm.org/wiki/RecordExtension)
1092 # https://mercurial-scm.org/wiki/RecordExtension)
1093 phelp = '---' + _("""
1093 phelp = '---' + _("""
1094 To remove '-' lines, make them ' ' lines (context).
1094 To remove '-' lines, make them ' ' lines (context).
1095 To remove '+' lines, delete them.
1095 To remove '+' lines, delete them.
1096 Lines starting with # will be removed from the patch.
1096 Lines starting with # will be removed from the patch.
1097
1097
1098 If the patch applies cleanly, the edited hunk will immediately be
1098 If the patch applies cleanly, the edited hunk will immediately be
1099 added to the record list. If it does not apply cleanly, a rejects
1099 added to the record list. If it does not apply cleanly, a rejects
1100 file will be generated: you can use that when you try again. If
1100 file will be generated: you can use that when you try again. If
1101 all lines of the hunk are removed, then the edit is aborted and
1101 all lines of the hunk are removed, then the edit is aborted and
1102 the hunk is left unchanged.
1102 the hunk is left unchanged.
1103 """)
1103 """)
1104 (patchfd, patchfn) = tempfile.mkstemp(prefix="hg-editor-",
1104 (patchfd, patchfn) = tempfile.mkstemp(prefix="hg-editor-",
1105 suffix=".diff", text=True)
1105 suffix=".diff", text=True)
1106 ncpatchfp = None
1106 ncpatchfp = None
1107 try:
1107 try:
1108 # Write the initial patch
1108 # Write the initial patch
1109 f = os.fdopen(patchfd, pycompat.sysstr("w"))
1109 f = os.fdopen(patchfd, pycompat.sysstr("w"))
1110 chunk.header.write(f)
1110 chunk.header.write(f)
1111 chunk.write(f)
1111 chunk.write(f)
1112 f.write('\n'.join(['# ' + i for i in phelp.splitlines()]))
1112 f.write('\n'.join(['# ' + i for i in phelp.splitlines()]))
1113 f.close()
1113 f.close()
1114 # Start the editor and wait for it to complete
1114 # Start the editor and wait for it to complete
1115 editor = ui.geteditor()
1115 editor = ui.geteditor()
1116 ret = ui.system("%s \"%s\"" % (editor, patchfn),
1116 ret = ui.system("%s \"%s\"" % (editor, patchfn),
1117 environ={'HGUSER': ui.username()},
1117 environ={'HGUSER': ui.username()},
1118 blockedtag='filterpatch')
1118 blockedtag='filterpatch')
1119 if ret != 0:
1119 if ret != 0:
1120 ui.warn(_("editor exited with exit code %d\n") % ret)
1120 ui.warn(_("editor exited with exit code %d\n") % ret)
1121 continue
1121 continue
1122 # Remove comment lines
1122 # Remove comment lines
1123 patchfp = open(patchfn)
1123 patchfp = open(patchfn)
1124 ncpatchfp = stringio()
1124 ncpatchfp = stringio()
1125 for line in util.iterfile(patchfp):
1125 for line in util.iterfile(patchfp):
1126 if not line.startswith('#'):
1126 if not line.startswith('#'):
1127 ncpatchfp.write(line)
1127 ncpatchfp.write(line)
1128 patchfp.close()
1128 patchfp.close()
1129 ncpatchfp.seek(0)
1129 ncpatchfp.seek(0)
1130 newpatches = parsepatch(ncpatchfp)
1130 newpatches = parsepatch(ncpatchfp)
1131 finally:
1131 finally:
1132 os.unlink(patchfn)
1132 os.unlink(patchfn)
1133 del ncpatchfp
1133 del ncpatchfp
1134 # Signal that the chunk shouldn't be applied as-is, but
1134 # Signal that the chunk shouldn't be applied as-is, but
1135 # provide the new patch to be used instead.
1135 # provide the new patch to be used instead.
1136 ret = False
1136 ret = False
1137 elif r == 3: # Skip
1137 elif r == 3: # Skip
1138 ret = skipfile = False
1138 ret = skipfile = False
1139 elif r == 4: # file (Record remaining)
1139 elif r == 4: # file (Record remaining)
1140 ret = skipfile = True
1140 ret = skipfile = True
1141 elif r == 5: # done, skip remaining
1141 elif r == 5: # done, skip remaining
1142 ret = skipall = False
1142 ret = skipall = False
1143 elif r == 6: # all
1143 elif r == 6: # all
1144 ret = skipall = True
1144 ret = skipall = True
1145 elif r == 7: # quit
1145 elif r == 7: # quit
1146 raise error.Abort(_('user quit'))
1146 raise error.Abort(_('user quit'))
1147 return ret, skipfile, skipall, newpatches
1147 return ret, skipfile, skipall, newpatches
1148
1148
1149 seen = set()
1149 seen = set()
1150 applied = {} # 'filename' -> [] of chunks
1150 applied = {} # 'filename' -> [] of chunks
1151 skipfile, skipall = None, None
1151 skipfile, skipall = None, None
1152 pos, total = 1, sum(len(h.hunks) for h in headers)
1152 pos, total = 1, sum(len(h.hunks) for h in headers)
1153 for h in headers:
1153 for h in headers:
1154 pos += len(h.hunks)
1154 pos += len(h.hunks)
1155 skipfile = None
1155 skipfile = None
1156 fixoffset = 0
1156 fixoffset = 0
1157 hdr = ''.join(h.header)
1157 hdr = ''.join(h.header)
1158 if hdr in seen:
1158 if hdr in seen:
1159 continue
1159 continue
1160 seen.add(hdr)
1160 seen.add(hdr)
1161 if skipall is None:
1161 if skipall is None:
1162 h.pretty(ui)
1162 h.pretty(ui)
1163 msg = (_('examine changes to %s?') %
1163 msg = (_('examine changes to %s?') %
1164 _(' and ').join("'%s'" % f for f in h.files()))
1164 _(' and ').join("'%s'" % f for f in h.files()))
1165 r, skipfile, skipall, np = prompt(skipfile, skipall, msg, None)
1165 r, skipfile, skipall, np = prompt(skipfile, skipall, msg, None)
1166 if not r:
1166 if not r:
1167 continue
1167 continue
1168 applied[h.filename()] = [h]
1168 applied[h.filename()] = [h]
1169 if h.allhunks():
1169 if h.allhunks():
1170 applied[h.filename()] += h.hunks
1170 applied[h.filename()] += h.hunks
1171 continue
1171 continue
1172 for i, chunk in enumerate(h.hunks):
1172 for i, chunk in enumerate(h.hunks):
1173 if skipfile is None and skipall is None:
1173 if skipfile is None and skipall is None:
1174 chunk.pretty(ui)
1174 chunk.pretty(ui)
1175 if total == 1:
1175 if total == 1:
1176 msg = messages['single'][operation] % chunk.filename()
1176 msg = messages['single'][operation] % chunk.filename()
1177 else:
1177 else:
1178 idx = pos - len(h.hunks) + i
1178 idx = pos - len(h.hunks) + i
1179 msg = messages['multiple'][operation] % (idx, total,
1179 msg = messages['multiple'][operation] % (idx, total,
1180 chunk.filename())
1180 chunk.filename())
1181 r, skipfile, skipall, newpatches = prompt(skipfile,
1181 r, skipfile, skipall, newpatches = prompt(skipfile,
1182 skipall, msg, chunk)
1182 skipall, msg, chunk)
1183 if r:
1183 if r:
1184 if fixoffset:
1184 if fixoffset:
1185 chunk = copy.copy(chunk)
1185 chunk = copy.copy(chunk)
1186 chunk.toline += fixoffset
1186 chunk.toline += fixoffset
1187 applied[chunk.filename()].append(chunk)
1187 applied[chunk.filename()].append(chunk)
1188 elif newpatches is not None:
1188 elif newpatches is not None:
1189 for newpatch in newpatches:
1189 for newpatch in newpatches:
1190 for newhunk in newpatch.hunks:
1190 for newhunk in newpatch.hunks:
1191 if fixoffset:
1191 if fixoffset:
1192 newhunk.toline += fixoffset
1192 newhunk.toline += fixoffset
1193 applied[newhunk.filename()].append(newhunk)
1193 applied[newhunk.filename()].append(newhunk)
1194 else:
1194 else:
1195 fixoffset += chunk.removed - chunk.added
1195 fixoffset += chunk.removed - chunk.added
1196 return (sum([h for h in applied.itervalues()
1196 return (sum([h for h in applied.itervalues()
1197 if h[0].special() or len(h) > 1], []), {})
1197 if h[0].special() or len(h) > 1], []), {})
class hunk(object):
    """One text hunk read from a unified or context diff.

    Attributes:
      number   - index of the hunk, used only in error messages here
      desc     - the range descriptor line; context hunks rewrite it into
                 unified ``@@ -start,len +start,len @@`` form
      hunk     - list of lines, desc first, followed by the hunk body in
                 unified notation (' ', '-' or '+' as first character)
      a        - old-side lines (in read_context_hunk these keep their
                 ' '/'-' marker)
      b        - new-side lines (in read_context_hunk these are stored
                 without a marker)
      starta, lena, startb, lenb - integer ranges parsed from the descriptor
    """
    def __init__(self, desc, num, lr, context):
        """Create the hunk and, when a line reader is given, parse it.

        lr is an object offering readline() and push(); passing None builds
        an empty shell (see getnormalized()). A true 'context' selects the
        context-diff parser, otherwise the unified parser is used.
        """
        self.number = num
        self.desc = desc
        self.hunk = [desc]
        self.a = []
        self.b = []
        self.starta = self.lena = None
        self.startb = self.lenb = None
        if lr is not None:
            if context:
                self.read_context_hunk(lr)
            else:
                self.read_unified_hunk(lr)

    def getnormalized(self):
        """Return a copy with line endings normalized to LF.

        Only the 'a' and 'b' lists are rewritten; the 'hunk' list is shared
        with the original object, not copied.
        """

        def normalize(lines):
            nlines = []
            for line in lines:
                if line.endswith('\r\n'):
                    line = line[:-2] + '\n'
                nlines.append(line)
            return nlines

        # Dummy object, it is rebuilt manually
        nh = hunk(self.desc, self.number, None, None)
        nh.number = self.number
        nh.desc = self.desc
        nh.hunk = self.hunk
        nh.a = normalize(self.a)
        nh.b = normalize(self.b)
        nh.starta = self.starta
        nh.startb = self.startb
        nh.lena = self.lena
        nh.lenb = self.lenb
        return nh

    def read_unified_hunk(self, lr):
        """Parse a unified hunk whose descriptor is already in self.desc.

        Raises PatchError when the descriptor does not match 'unidesc'.
        A missing length in the descriptor defaults to 1.
        """
        m = unidesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.starta, self.lena, self.startb, self.lenb = m.groups()
        if self.lena is None:
            self.lena = 1
        else:
            self.lena = int(self.lena)
        if self.lenb is None:
            self.lenb = 1
        else:
            self.lenb = int(self.lenb)
        self.starta = int(self.starta)
        self.startb = int(self.startb)
        diffhelpers.addlines(lr, self.hunk, self.lena, self.lenb, self.a,
                             self.b)
        # if we hit eof before finishing out the hunk, the last line will
        # be zero length.  Lets try to fix it up.
        while len(self.hunk[-1]) == 0:
            del self.hunk[-1]
            del self.a[-1]
            del self.b[-1]
            self.lena -= 1
            self.lenb -= 1
        self._fixnewline(lr)

    def read_context_hunk(self, lr):
        """Parse a context-diff hunk and convert it to unified notation.

        The descriptor line is read from lr (replacing self.desc), then the
        old block and the new block are read in turn and merged into
        self.hunk. Raises PatchError on a malformed descriptor or body line.
        """
        self.desc = lr.readline()
        m = contextdesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.starta, aend = m.groups()
        self.starta = int(self.starta)
        if aend is None:
            aend = self.starta
        self.lena = int(aend) - self.starta
        if self.starta:
            self.lena += 1
        for x in xrange(self.lena):
            l = lr.readline()
            if l.startswith('---'):
                # lines addition, old block is empty
                lr.push(l)
                break
            # the marker occupies the first two characters of the line
            s = l[2:]
            if l.startswith('- ') or l.startswith('! '):
                u = '-' + s
            # NOTE(review): l[2:] drops two characters, so the context
            # marker is presumably two spaces wide - confirm this prefix.
            elif l.startswith(' '):
                u = ' ' + s
            else:
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.a.append(u)
            self.hunk.append(u)

        l = lr.readline()
        if l.startswith('\\ '):
            # marker line after the old block: drop the final character of
            # the last old line
            s = self.a[-1][:-1]
            self.a[-1] = s
            self.hunk[-1] = s
            l = lr.readline()
        m = contextdesc.match(l)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.startb, bend = m.groups()
        self.startb = int(self.startb)
        if bend is None:
            bend = self.startb
        self.lenb = int(bend) - self.startb
        if self.startb:
            self.lenb += 1
        # index into self.hunk of the next line to compare with the new block
        hunki = 1
        for x in xrange(self.lenb):
            l = lr.readline()
            if l.startswith('\\ '):
                # XXX: the only way to hit this is with an invalid line range.
                # The no-eol marker is not counted in the line range, but I
                # guess there are diff(1) out there which behave differently.
                s = self.b[-1][:-1]
                self.b[-1] = s
                self.hunk[hunki - 1] = s
                continue
            if not l:
                # line deletions, new block is empty and we hit EOF
                lr.push(l)
                break
            s = l[2:]
            if l.startswith('+ ') or l.startswith('! '):
                u = '+' + s
            # NOTE(review): same two-character marker question as above.
            elif l.startswith(' '):
                u = ' ' + s
            elif len(self.b) == 0:
                # line deletions, new block is empty
                lr.push(l)
                break
            else:
                # NOTE(review): message says "old text" although this loop
                # reads the new block - left unchanged, confirm intent.
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.b.append(s)
            # merge 'u' into self.hunk: skip over '-' lines, stop on a line
            # equal to 'u', otherwise insert 'u' at the current position
            while True:
                if hunki >= len(self.hunk):
                    h = ""
                else:
                    h = self.hunk[hunki]
                hunki += 1
                if h == u:
                    break
                elif h.startswith('-'):
                    continue
                else:
                    self.hunk.insert(hunki - 1, u)
                    break

        if not self.a:
            # this happens when lines were only added to the hunk
            for x in self.hunk:
                if x.startswith('-') or x.startswith(' '):
                    self.a.append(x)
        if not self.b:
            # this happens when lines were only deleted from the hunk
            for x in self.hunk:
                if x.startswith('+') or x.startswith(' '):
                    self.b.append(x[1:])
        # @@ -start,len +start,len @@
        self.desc = "@@ -%d,%d +%d,%d @@\n" % (self.starta, self.lena,
                                               self.startb, self.lenb)
        self.hunk[0] = self.desc
        self._fixnewline(lr)

    def _fixnewline(self, lr):
        """Consume a following '\\ ' marker line, if any.

        When the next line starts with a backslash and a space the hunk is
        handed to diffhelpers.fix_newline; otherwise the line is pushed back
        onto lr untouched.
        """
        l = lr.readline()
        if l.startswith('\\ '):
            diffhelpers.fix_newline(self.hunk, self.a, self.b)
        else:
            lr.push(l)

    def complete(self):
        """Return True when both sides hold as many lines as declared."""
        return len(self.a) == self.lena and len(self.b) == self.lenb

    def _fuzzit(self, old, new, fuzz, toponly):
        """Trim up to 'fuzz' context lines from 'old' and 'new'.

        Returns (old, new, top) where 'top' is the number of lines removed
        from the start. With a zero fuzz (or empty 'old') the inputs are
        returned unchanged with top == 0. When 'toponly' is true nothing is
        removed from the bottom.
        """
        # this removes context lines from the top and bottom of list 'l'.  It
        # checks the hunk to make sure only context lines are removed, and then
        # returns a new shortened list of lines.
        fuzz = min(fuzz, len(old))
        if fuzz:
            top = 0
            bot = 0
            hlen = len(self.hunk)
            for x in xrange(hlen - 1):
                # the hunk starts with the @@ line, so use x+1
                if self.hunk[x + 1][0] == ' ':
                    top += 1
                else:
                    break
            if not toponly:
                for x in xrange(hlen - 1):
                    if self.hunk[hlen - bot - 1][0] == ' ':
                        bot += 1
                    else:
                        break

            bot = min(fuzz, bot)
            top = min(fuzz, top)
            return old[top:len(old) - bot], new[top:len(new) - bot], top
        return old, new, 0

    def fuzzit(self, fuzz, toponly):
        """Return (old, oldstart, new, newstart) after fuzzing.

        The start values are starta/startb shifted by the number of lines
        trimmed from the top, then decremented by one for non-empty ranges.
        """
        old, new, top = self._fuzzit(self.a, self.b, fuzz, toponly)
        oldstart = self.starta + top
        newstart = self.startb + top
        # zero length hunk ranges already have their start decremented
        if self.lena and oldstart > 0:
            oldstart -= 1
        if self.lenb and newstart > 0:
            newstart -= 1
        return old, oldstart, new, newstart
1414
1414
class binhunk(object):
    'A binary patch file.'
    def __init__(self, lr, fname):
        """Read a git binary hunk for file 'fname' from line reader 'lr'."""
        self.text = None
        self.delta = False
        self.hunk = ['GIT binary patch\n']
        self._fname = fname
        self._read(lr)

    def complete(self):
        """Return True once the payload has been decoded into self.text."""
        return self.text is not None

    def new(self, lines):
        """Return the resulting content as a one-element list.

        A literal hunk yields its text as is; a delta hunk is applied to the
        concatenation of 'lines' through applybindelta().
        """
        if not self.delta:
            return [self.text]
        return [applybindelta(self.text, ''.join(lines))]

    def _read(self, lr):
        """Parse the hunk from 'lr', recording every line read in self.hunk.

        Raises PatchError when no 'literal'/'delta' header is found, when a
        data line cannot be base85-decoded, or when the decompressed length
        differs from the size announced in the header.
        """
        def nextline():
            # keep the raw line in the hunk, hand back the stripped one
            raw = lr.readline()
            self.hunk.append(raw)
            return raw.rstrip('\r\n')

        # look for the "literal <size>" or "delta <size>" header
        expected = 0
        while True:
            header = nextline()
            if not header:
                raise PatchError(_('could not extract "%s" binary data')
                                 % self._fname)
            if header.startswith('literal '):
                expected = int(header[8:].rstrip())
                break
            if header.startswith('delta '):
                expected = int(header[6:].rstrip())
                self.delta = True
                break

        pieces = []
        row = nextline()
        while len(row) > 1:
            # first character encodes the decoded length of this row:
            # 'A'-'Z' map to 1-26, anything else is offset from 'a' at 27
            marker = row[0]
            if 'A' <= marker <= 'Z':
                nbytes = ord(marker) - ord('A') + 1
            else:
                nbytes = ord(marker) - ord('a') + 27
            try:
                pieces.append(util.b85decode(row[1:])[:nbytes])
            except ValueError as e:
                raise PatchError(_('could not decode "%s" binary patch: %s')
                                 % (self._fname, str(e)))
            row = nextline()

        payload = zlib.decompress(''.join(pieces))
        if len(payload) != expected:
            raise PatchError(_('"%s" length is %d bytes, should be %d')
                             % (self._fname, len(payload), expected))
        self.text = payload
1470
1470
def parsefilename(str):
    """Extract the file name from a '--- name' or '+++ name' diff line.

    The first four characters and any trailing CR/LF are dropped; the name
    then ends at the first tab, or at the first space when there is no tab.
    """
    # --- filename \t|space stuff
    name = str[4:].rstrip('\r\n')
    for sep in ('\t', ' '):
        cut = name.find(sep)
        if cut >= 0:
            return name[:cut]
    return name
1480
1480
def reversehunks(hunks):
    '''reverse the signs in the hunks given as argument

    This function operates on hunks coming out of patch.filterpatch, that is
    a list of the form: [header1, hunk1, hunk2, header2...]. Items offering a
    'reversehunk' method are replaced by its result, any other item is kept
    as is. Example usage:

    >>> rawpatch = b"""diff --git a/folder1/g b/folder1/g
    ... --- a/folder1/g
    ... +++ b/folder1/g
    ... @@ -1,7 +1,7 @@
    ... +firstline
    ...  c
    ...  1
    ...  2
    ... + 3
    ... -4
    ...  5
    ...  d
    ... +lastline"""
    >>> hunks = parsepatch([rawpatch])
    >>> hunkscomingfromfilterpatch = []
    >>> for h in hunks:
    ...     hunkscomingfromfilterpatch.append(h)
    ...     hunkscomingfromfilterpatch.extend(h.hunks)

    >>> reversedhunks = reversehunks(hunkscomingfromfilterpatch)
    >>> from . import util
    >>> fp = util.stringio()
    >>> for c in reversedhunks:
    ...      c.write(fp)
    >>> fp.seek(0) or None
    >>> reversedpatch = fp.read()
    >>> print(pycompat.sysstr(reversedpatch))
    diff --git a/folder1/g b/folder1/g
    --- a/folder1/g
    +++ b/folder1/g
    @@ -1,4 +1,3 @@
    -firstline
     c
     1
     2
    @@ -2,6 +1,6 @@
     c
     1
     2
    - 3
    +4
     5
     d
    @@ -6,3 +5,2 @@
     5
     d
    -lastline

    '''

    def flipped(item):
        # headers have no 'reversehunk' and pass through untouched
        if util.safehasattr(item, 'reversehunk'):
            return item.reversehunk()
        return item

    return [flipped(item) for item in hunks]
1543
1543
def parsepatch(originalchunks, maxcontext=None):
    """patch -> [] of headers -> [] of hunks

    'originalchunks' is an iterable of strings that are joined and fed to
    scanpatch(); each (state, data) event it yields drives the state machine
    below. Returns the list of header objects, each carrying its hunks.

    Raises PatchError when scanpatch() produces an event that is not allowed
    after the previous one.

    If maxcontext is not None, trim context lines if necessary.

    >>> rawpatch = b'''diff --git a/folder1/g b/folder1/g
    ... --- a/folder1/g
    ... +++ b/folder1/g
    ... @@ -1,8 +1,10 @@
    ...  1
    ...  2
    ... -3
    ...  4
    ...  5
    ...  6
    ... +6.1
    ... +6.2
    ...  7
    ...  8
    ... +9'''
    >>> out = util.stringio()
    >>> headers = parsepatch([rawpatch], maxcontext=1)
    >>> for header in headers:
    ...     header.write(out)
    ...     for hunk in header.hunks:
    ...         hunk.write(out)
    >>> print(pycompat.sysstr(out.getvalue()))
    diff --git a/folder1/g b/folder1/g
    --- a/folder1/g
    +++ b/folder1/g
    @@ -2,3 +2,2 @@
     2
    -3
     4
    @@ -6,2 +5,4 @@
     6
    +6.1
    +6.2
     7
    @@ -8,1 +9,2 @@
     8
    +9
    """
    class parser(object):
        """patch parsing state machine"""
        def __init__(self):
            self.fromline = 0
            self.toline = 0
            self.proc = ''
            self.header = None
            self.context = []
            self.before = []
            self.hunk = []
            self.headers = []

        def addrange(self, limits):
            # a range event resets the current line counters; the end
            # values are unpacked but not used here
            fromstart, fromend, tostart, toend, proc = limits
            self.fromline = int(fromstart)
            self.toline = int(tostart)
            self.proc = proc

        def addcontext(self, context):
            # trailing context closes the pending hunk, if there is one
            if self.hunk:
                h = recordhunk(self.header, self.fromline, self.toline,
                        self.proc, self.before, self.hunk, context, maxcontext)
                self.header.hunks.append(h)
                self.fromline += len(self.before) + h.removed
                self.toline += len(self.before) + h.added
                self.before = []
                self.hunk = []
            self.context = context

        def addhunk(self, hunk):
            # context seen so far becomes the leading context of this hunk
            if self.context:
                self.before = self.context
                self.context = []
            self.hunk = hunk

        def newfile(self, hdr):
            # flush any pending hunk before switching to the new header
            self.addcontext([])
            h = header(hdr)
            self.headers.append(h)
            self.header = h

        def addother(self, line):
            pass # 'other' lines are ignored

        def finished(self):
            self.addcontext([])
            return self.headers

        # transitions[current state][next state] -> handler(parser, data)
        transitions = {
            'file': {'context': addcontext,
                     'file': newfile,
                     'hunk': addhunk,
                     'range': addrange},
            'context': {'file': newfile,
                        'hunk': addhunk,
                        'range': addrange,
                        'other': addother},
            'hunk': {'context': addcontext,
                     'file': newfile,
                     'range': addrange},
            'range': {'context': addcontext,
                      'hunk': addhunk},
            'other': {'other': addother},
            }

    p = parser()
    fp = stringio()
    fp.write(''.join(originalchunks))
    fp.seek(0)

    state = 'context'
    for newstate, data in scanpatch(fp):
        # Only the table lookup is guarded: a KeyError raised from inside a
        # handler must not be reported as an unhandled transition.
        try:
            handler = p.transitions[state][newstate]
        except KeyError:
            raise PatchError('unhandled transition: %s -> %s' %
                             (state, newstate))
        handler(p, data)
        state = newstate
    return p.finished()
1667
1667
def pathtransform(path, strip, prefix):
    '''turn a path from a patch into a path suitable for the repository

    'strip' is the number of leading directory components to remove.
    prefix, if not empty, is expected to be normalized with a / at the end.

    Returns (stripped components, path in repository).

    Raises PatchError when the path holds fewer than 'strip' separators.

    >>> pathtransform(b'a/b/c', 0, b'')
    ('', 'a/b/c')
    >>> pathtransform(b' a/b/c ', 0, b'')
    ('', ' a/b/c')
    >>> pathtransform(b' a/b/c ', 2, b'')
    ('a/b/', 'c')
    >>> pathtransform(b'a/b/c', 0, b'd/e/')
    ('', 'd/e/a/b/c')
    >>> pathtransform(b' a//b/c ', 2, b'd/e/')
    ('a//b/', 'd/e/c')
    >>> pathtransform(b'a/b/c', 3, b'')
    Traceback (most recent call last):
    PatchError: unable to strip away 1 of 3 dirs from a/b/c
    '''
    if strip == 0:
        return '', prefix + path.rstrip()
    lastidx = len(path) - 1
    cut = 0
    # 'remaining' counts down the components still to be stripped
    for remaining in range(strip, 0, -1):
        cut = path.find('/', cut)
        if cut == -1:
            raise PatchError(_("unable to strip away %d of %d dirs from %s") %
                             (remaining, strip, path))
        cut += 1
        # consume '//' in the path
        while cut < lastidx and path[cut:cut + 1] == '/':
            cut += 1
    return path[:cut].lstrip(), prefix + path[cut:].rstrip()
1705
1705
def makepatchmeta(backend, afile_orig, bfile_orig, hunk, strip, prefix):
    """build a patchmeta record from the two file names of a diff header

    backend is queried (through exists()) to find out which of the two
    names is present; hunk is the first hunk of the file and is only
    inspected for its start/length fields. strip and prefix are passed
    through to pathtransform().

    The returned patchmeta has op set to 'ADD' or 'DELETE' when the header
    and hunk describe a creation or a removal; otherwise op is left as
    patchmeta() initialised it.

    Raises PatchError when both names are /dev/null.
    """
    nulla = afile_orig == "/dev/null"
    nullb = bfile_orig == "/dev/null"
    create = nulla and hunk.starta == 0 and hunk.lena == 0
    remove = nullb and hunk.startb == 0 and hunk.lenb == 0

    abase, afile = pathtransform(afile_orig, strip, prefix)
    gooda = not nulla and backend.exists(afile)
    bbase, bfile = pathtransform(bfile_orig, strip, prefix)
    # identical names need a single existence check
    goodb = gooda if afile == bfile else (not nullb and backend.exists(bfile))
    missing = not (goodb or gooda or create)

    # some diff programs apparently produce patches where the afile is
    # not /dev/null, but afile starts with bfile
    abasedir = afile[:afile.rfind('/') + 1]
    bbasedir = bfile[:bfile.rfind('/') + 1]
    if (missing and abasedir == bbasedir and afile.startswith(bfile)
        and hunk.starta == 0 and hunk.lena == 0):
        create = True
        missing = False

    # If afile is "a/b/foo" and bfile is "a/b/foo.orig" we assume the
    # diff is between a file and its backup. In this case, the original
    # file should be patched (see original mpatch code).
    isbackup = (abase == bbase and bfile.startswith(afile))
    # name to use whenever the "b" side is eligible
    preferred = afile if isbackup else bfile

    fname = None
    if not missing:
        if gooda and goodb:
            fname = preferred
        elif gooda:
            fname = afile

    if not fname:
        # no existing file was selected: fall back on the header names
        if not nullb:
            fname = preferred
        elif not nulla:
            fname = afile
        else:
            raise PatchError(_("undefined source and destination files"))

    gp = patchmeta(fname)
    if create:
        gp.op = 'ADD'
    elif remove:
        gp.op = 'DELETE'
    return gp
1760
1760
def scanpatch(fp):
    """like patch.iterhunks, but yield different events

    - ('file', [header_lines + fromfile + tofile])
    - ('context', [context_lines])
    - ('hunk', [hunk_lines])
    - ('range', (-start,len, +start,len, proc))
    - ('other', line) for any line matching none of the above
    """
    lines_re = re.compile(br'@@ -(\d+),(\d+) \+(\d+),(\d+) @@\s*(.*)')
    lr = linereader(fp)

    def scanwhile(first, p):
        """collect first plus the following lines for which p() is true"""
        collected = [first]
        while True:
            nxt = lr.readline()
            if nxt == '':
                break
            if not p(nxt):
                # first rejected line goes back to the reader
                lr.push(nxt)
                break
            collected.append(nxt)
        return collected

    def notheader(line):
        # a header block ends at the next '---' or 'diff' line
        s = line.split(None, 1)
        return not s or s[0] not in ('---', 'diff')

    def iscontext(l):
        return l[0] in ' \\'

    def ischange(l):
        return l[0] in '-+\\'

    while True:
        line = lr.readline()
        if line == '':
            break
        if line.startswith('diff --git a/') or line.startswith('diff -r '):
            header = scanwhile(line, notheader)
            fromfile = lr.readline()
            if fromfile.startswith('---'):
                tofile = lr.readline()
                header += [fromfile, tofile]
            else:
                lr.push(fromfile)
            yield 'file', header
        elif line[0:1] == ' ':
            yield 'context', scanwhile(line, iscontext)
        elif line[0] in '-+':
            yield 'hunk', scanwhile(line, ischange)
        else:
            m = lines_re.match(line)
            if m:
                yield 'range', m.groups()
            else:
                yield 'other', line
1806
1806
def scangitpatch(lr, firstline):
    """
    Git patches can emit:
    - rename a to b
    - change b
    - copy a to c
    - change c

    We cannot apply this sequence as-is, the renamed 'a' could not be
    found for it would have been renamed already. And we cannot copy
    from 'b' instead because 'b' would have been changed already. So
    we scan the git patch for copy and rename commands so we can
    perform the copies ahead of time.

    Returns whatever readgitpatch() produces for the input starting at
    firstline; the underlying stream is repositioned afterwards.
    """
    stream = lr.fp
    try:
        offset = stream.tell()
    except IOError:
        # tell() failed: read the rest into an in-memory buffer and
        # rewind that buffer to its start once scanning is done
        offset = 0
        stream = stringio(lr.fp.read())
    scanner = linereader(stream)
    scanner.push(firstline)
    found = readgitpatch(scanner)
    stream.seek(offset)
    return found
1832
1832
def iterhunks(fp):
    """Read a patch and yield the following events:
    - ("file", (afile, bfile, firsthunk, gp)): select a new target file.
      firsthunk is None for git entries that carry no hunk; gp is a copy
      of the matching git metadata record, or None.
    - ("hunk", hunk): a new hunk is ready to be applied, follows a
    "file" event.
    - ("git", gitchanges): current diff is in git format, gitchanges
    is the list of COPY/RENAME gitpatch records. Unique event.
    """
    afile = ""
    bfile = ""
    state = None
    hunknum = 0
    # newfile: a file header was just parsed on this iteration
    # emitfile: a 'file' event is still owed before the next 'hunk' event
    emitfile = newfile = False
    # None until the first 'diff --git' line triggers a metadata scan
    gitpatches = None

    # our states
    BFILE = 1
    # None: format not known yet, True: context diff, False: unified diff
    context = None
    lr = linereader(fp)

    for x in iter(lr.readline, ''):
        # a hunk can only start once a file header has been seen
        if state == BFILE and (
            (not context and x[0] == '@')
            or (context is not False and x.startswith('***************'))
            or x.startswith('GIT binary patch')):
            gp = None
            if (gitpatches and
                gitpatches[-1].ispatching(afile, bfile)):
                gp = gitpatches.pop()
            if x.startswith('GIT binary patch'):
                # NOTE(review): gp is None here when no git metadata matched
                # afile/bfile, in which case gp.path raises AttributeError
                # -- confirm whether that input is reachable
                h = binhunk(lr, gp.path)
            else:
                if context is None and x.startswith('***************'):
                    context = True
                h = hunk(x, hunknum + 1, lr, context)
            hunknum += 1
            if emitfile:
                emitfile = False
                # hand out a copy of the record (or None when there is none)
                yield 'file', (afile, bfile, h, gp and gp.copy() or None)
            yield 'hunk', h
        elif x.startswith('diff --git a/'):
            m = gitre.match(x.rstrip(' \r\n'))
            if not m:
                continue
            if gitpatches is None:
                # scan whole input for git metadata
                gitpatches = scangitpatch(lr, x)
                yield 'git', [g.copy() for g in gitpatches
                              if g.op in ('COPY', 'RENAME')]
                # reversed so that pop() hands records out in input order
                gitpatches.reverse()
            afile = 'a/' + m.group(1)
            bfile = 'b/' + m.group(2)
            # records preceding the current file get a hunk-less 'file'
            # event each
            while gitpatches and not gitpatches[-1].ispatching(afile, bfile):
                gp = gitpatches.pop()
                yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())
            if not gitpatches:
                raise PatchError(_('failed to synchronize metadata for "%s"')
                                 % afile[2:])
            gp = gitpatches[-1]
            newfile = True
        elif x.startswith('---'):
            # check for a unified diff
            l2 = lr.readline()
            if not l2.startswith('+++'):
                lr.push(l2)
                continue
            newfile = True
            context = False
            afile = parsefilename(x)
            bfile = parsefilename(l2)
        elif x.startswith('***'):
            # check for a context diff
            l2 = lr.readline()
            if not l2.startswith('---'):
                lr.push(l2)
                continue
            # l3 is only peeked at: it is pushed back right away
            l3 = lr.readline()
            lr.push(l3)
            if not l3.startswith("***************"):
                lr.push(l2)
                continue
            newfile = True
            context = True
            afile = parsefilename(x)
            bfile = parsefilename(l2)

        if newfile:
            # a header was recognised: reset the per-file state
            newfile = False
            emitfile = True
            state = BFILE
            hunknum = 0

    # git records left over at end of input still get a 'file' event
    while gitpatches:
        gp = gitpatches.pop()
        yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())
1928
1928
def applybindelta(binchunk, data):
    """Apply a binary delta hunk
    The algorithm used is the algorithm from git's patch-delta.c

    binchunk is the raw delta: two variable-length size fields followed by
    a sequence of opcodes. data is the source text the copy opcodes read
    from. Both are byte strings.

    Returns the reconstructed byte string.

    Raises PatchError on the reserved opcode 0.
    """
    # A bytearray yields integers on indexing under both Python 2 and
    # Python 3, so no ord() on individual items is needed.
    raw = bytearray(binchunk)
    end = len(raw)

    def deltahead(start):
        """return the index just past the size field beginning at start"""
        i = start
        while i < end:
            i += 1
            # the last byte of a size field has its high bit clear
            if not (raw[i - 1] & 0x80):
                return i
        return i

    # skip the two leading size fields; their values are not used
    i = deltahead(deltahead(0))
    # collect the pieces and join once instead of growing a string
    out = []
    while i < end:
        cmd = raw[i]
        i += 1
        if (cmd & 0x80):
            # copy from data: the low 7 bits of cmd tell which offset and
            # size bytes follow (little-endian, absent bytes are zero)
            offset = 0
            size = 0
            if (cmd & 0x01):
                offset = raw[i]
                i += 1
            if (cmd & 0x02):
                offset |= raw[i] << 8
                i += 1
            if (cmd & 0x04):
                offset |= raw[i] << 16
                i += 1
            if (cmd & 0x08):
                offset |= raw[i] << 24
                i += 1
            if (cmd & 0x10):
                size = raw[i]
                i += 1
            if (cmd & 0x20):
                size |= raw[i] << 8
                i += 1
            if (cmd & 0x40):
                size |= raw[i] << 16
                i += 1
            if size == 0:
                size = 0x10000
            offset_end = offset + size
            out.append(data[offset:offset_end])
        elif cmd != 0:
            # insert the next cmd bytes of the delta itself
            offset_end = i + cmd
            out.append(binchunk[i:offset_end])
            i += cmd
        else:
            raise PatchError(_('unexpected delta opcode 0'))
    return b''.join(out)
1984
1984
def applydiff(ui, fp, backend, store, strip=1, prefix='', eolmode='strict'):
    """Reads a patch from fp and tries to apply it.

    Returns 0 for a clean patch, -1 if any rejects were found and 1 if
    there was any fuzz.

    If 'eolmode' is 'strict', the patch content and patched file are
    read in binary mode. Otherwise, line endings are ignored when
    patching then normalized according to 'eolmode'.

    This is _applydiff() with patchfile as the per-file patcher; every
    other argument is forwarded unchanged.
    """
    return _applydiff(ui, fp, patchfile, backend, store, strip=strip,
                      prefix=prefix, eolmode=eolmode)
1997
1997
1998 def _canonprefix(repo, prefix):
1998 def _canonprefix(repo, prefix):
1999 if prefix:
1999 if prefix:
2000 prefix = pathutil.canonpath(repo.root, repo.getcwd(), prefix)
2000 prefix = pathutil.canonpath(repo.root, repo.getcwd(), prefix)
2001 if prefix != '':
2001 if prefix != '':
2002 prefix += '/'
2002 prefix += '/'
2003 return prefix
2003 return prefix
2004
2004
def _applydiff(ui, fp, patcher, backend, store, strip=1, prefix='',
               eolmode='strict'):
    """apply the patch read from fp, driven by the events of iterhunks()

    patcher is called as patcher(ui, gp, backend, store, eolmode=eolmode)
    for every file that has hunks; the object it returns must provide
    apply(hunk) and close(). backend receives the resulting file
    operations (exists/unlink/setfile/getfile) and store keeps the
    content of copy/rename sources.

    Returns -1 if anything was rejected, otherwise 1 if any hunk applied
    with a positive apply() result, otherwise 0.

    Raises PatchError for a missing copy/rename source or an already
    existing destination, and error.Abort on an unknown parser event.
    """
    prefix = _canonprefix(backend.repo, prefix)
    def pstrip(p):
        # git metadata paths have no a/ or b/ component, hence strip - 1
        return pathtransform(p, strip - 1, prefix)[1]

    rejects = 0
    err = 0
    current_file = None

    for state, values in iterhunks(fp):
        if state == 'hunk':
            # hunks of a file whose patcher could not be created are dropped
            if not current_file:
                continue
            ret = current_file.apply(values)
            if ret > 0:
                err = 1
        elif state == 'file':
            # finish the previous file before moving to the next one
            if current_file:
                rejects += current_file.close()
                current_file = None
            afile, bfile, first_hunk, gp = values
            if gp:
                gp.path = pstrip(gp.path)
                if gp.oldpath:
                    gp.oldpath = pstrip(gp.oldpath)
            else:
                gp = makepatchmeta(backend, afile, bfile, first_hunk, strip,
                                   prefix)
            if gp.op == 'RENAME':
                backend.unlink(gp.oldpath)
            if not first_hunk:
                # metadata-only entry: handled here, no patcher is created
                if gp.op == 'DELETE':
                    backend.unlink(gp.path)
                    continue
                data, mode = None, None
                if gp.op in ('RENAME', 'COPY'):
                    data, mode = store.getfile(gp.oldpath)[:2]
                    if data is None:
                        # This means that the old path does not exist
                        raise PatchError(_("source file '%s' does not exist")
                                         % gp.oldpath)
                if gp.mode:
                    mode = gp.mode
                    if gp.op == 'ADD':
                        # Added files without content have no hunk and
                        # must be created
                        data = ''
                if data or mode:
                    if (gp.op in ('ADD', 'RENAME', 'COPY')
                        and backend.exists(gp.path)):
                        raise PatchError(_("cannot create %s: destination "
                                           "already exists") % gp.path)
                    backend.setfile(gp.path, data, mode, gp.oldpath)
                continue
            try:
                current_file = patcher(ui, gp, backend, store,
                                       eolmode=eolmode)
            except PatchError as inst:
                # count the whole file as one reject and keep going
                ui.warn(str(inst) + '\n')
                current_file = None
                rejects += 1
                continue
        elif state == 'git':
            # save the content of copy/rename sources before it is modified
            for gp in values:
                path = pstrip(gp.oldpath)
                data, mode = backend.getfile(path)
                if data is None:
                    # The error ignored here will trigger a getfile()
                    # error in a place more appropriate for error
                    # handling, and will not interrupt the patching
                    # process.
                    pass
                else:
                    store.setfile(path, data, mode)
        else:
            raise error.Abort(_('unsupported parser state: %s') % state)

    if current_file:
        rejects += current_file.close()

    if rejects:
        return -1
    return err
2089
2089
def _externalpatch(ui, repo, patcher, patchname, strip, files,
                   similarity):
    """use <patcher> to apply <patchname> to the working directory.
    returns whether patch was applied with fuzz factor.

    The command is run through util.popen() with '-d <repo root>' and
    '-p<strip>', reading the patch from <patchname>. Its output is parsed
    line by line: every file named in a 'patching file' line is added to
    files, and fuzz/reject/failure lines are forwarded as warnings.

    Raises PatchError when the command exits with a non-zero status.
    """

    fuzz = False
    args = []
    cwd = repo.root
    if cwd:
        args.append('-d %s' % util.shellquote(cwd))
    fp = util.popen('%s %s -p%d < %s' % (patcher, ' '.join(args), strip,
                                       util.shellquote(patchname)))
    # The tool may report fuzz or a failure before naming any file; start
    # from a defined state so those lines cannot hit an unbound local.
    pf = None
    printed_file = False
    try:
        for line in util.iterfile(fp):
            line = line.rstrip()
            ui.note(line + '\n')
            if line.startswith('patching file '):
                pf = util.parsepatchoutput(line)
                printed_file = False
                files.add(pf)
            elif 'with fuzz' in line:
                fuzz = True
                # name the file once before its first warning
                if pf is not None and not printed_file:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
            elif 'saving rejects to file' in line:
                ui.warn(line + '\n')
            elif 'FAILED' in line:
                if pf is not None and not printed_file:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
    finally:
        # record whatever was touched even if reading the output failed
        if files:
            scmutil.marktouched(repo, files, similarity)
    code = fp.close()
    if code:
        raise PatchError(_("patch command failed: %s") %
                         util.explainexit(code)[0])
    return fuzz
2131
2131
def patchbackend(ui, backend, patchobj, strip, prefix, files=None,
                 eolmode='strict'):
    """apply patchobj through backend and report whether fuzz was needed

    patchobj is either something open() accepts as a file name or an
    already open file-like object. files, when given, is updated in place
    with the value returned by backend.close(). An eolmode of None is
    replaced by the patch.eol configuration value.

    Raises error.Abort on an unknown eolmode and PatchError when the
    patch does not apply.
    """
    touched = set() if files is None else files
    if eolmode is None:
        eolmode = ui.config('patch', 'eol')
    lowered = eolmode.lower()
    if lowered not in eolmodes:
        # report the value as it was given, not the lower-cased form
        raise error.Abort(_('unsupported line endings type: %s') % eolmode)

    store = filestore()
    try:
        fp = open(patchobj, 'rb')
    except TypeError:
        # not a file name: use the object itself as the stream
        fp = patchobj
    try:
        ret = applydiff(ui, fp, backend, store, strip=strip, prefix=prefix,
                        eolmode=lowered)
    finally:
        # only close what was opened here
        if fp != patchobj:
            fp.close()
        touched.update(backend.close())
        store.close()
    if ret < 0:
        raise PatchError(_('patch failed to apply'))
    return ret > 0
2158
2158
def internalpatch(ui, repo, patchobj, strip, prefix='', files=None,
                  eolmode='strict', similarity=0):
    """use builtin patch to apply <patchobj> to the working directory.
    returns whether patch was applied with fuzz factor.

    similarity is only handed to the workingbackend constructor; the
    remaining arguments are forwarded to patchbackend().
    """
    backend = workingbackend(ui, repo, similarity)
    return patchbackend(ui, backend, patchobj, strip, prefix, files, eolmode)
2165
2165
def patchrepo(ui, repo, ctx, store, patchobj, strip, prefix, files=None,
              eolmode='strict'):
    """apply <patchobj> through a repobackend built from repo, ctx and store

    Returns the result of patchbackend(), i.e. whether the patch applied
    with fuzz.
    """
    backend = repobackend(ui, repo, ctx, store)
    return patchbackend(ui, backend, patchobj, strip, prefix, files, eolmode)
2170
2170
def patch(ui, repo, patchname, strip=1, prefix='', files=None, eolmode='strict',
          similarity=0):
    """Apply <patchname> to the working directory.

    The external program named by the ui.patch configuration entry is
    used when that entry is set; the builtin patcher is used otherwise.

    'eolmode' specifies how end of lines should be handled. It can be:
    - 'strict': inputs are read in binary mode, EOLs are preserved
    - 'crlf': EOLs are ignored when patching and reset to CRLF
    - 'lf': EOLs are ignored when patching and reset to LF
    - None: get it from user settings, default to 'strict'
    'eolmode' is ignored when using an external patcher program.

    Returns whether patch was applied with fuzz factor.
    """
    external = ui.config('ui', 'patch')
    if files is None:
        files = set()
    if not external:
        return internalpatch(ui, repo, patchname, strip, prefix, files,
                             eolmode, similarity)
    # prefix and eolmode are not passed to the external program
    return _externalpatch(ui, repo, external, patchname, strip,
                          files, similarity)
2192
2192
def changedfiles(ui, repo, patchpath, strip=1, prefix=''):
    """return the set of paths the patch stored at patchpath refers to

    The patch is parsed but not applied. For every file entry the target
    path is collected, plus the old path when the entry is a rename.

    Raises error.Abort on an unknown parser event.
    """
    backend = fsbackend(ui, repo.root)
    prefix = _canonprefix(repo, prefix)

    def gitpath(p):
        # git metadata paths carry one leading component less
        return pathtransform(p, strip - 1, prefix)[1]

    with open(patchpath, 'rb') as patchfp:
        touched = set()
        for event, payload in iterhunks(patchfp):
            if event in ('hunk', 'git'):
                continue
            if event != 'file':
                raise error.Abort(_('unsupported parser state: %s') % event)
            afile, bfile, first_hunk, gp = payload
            if gp:
                gp.path = gitpath(gp.path)
                if gp.oldpath:
                    gp.oldpath = gitpath(gp.oldpath)
            else:
                gp = makepatchmeta(backend, afile, bfile, first_hunk, strip,
                                   prefix)
            touched.add(gp.path)
            if gp.op == 'RENAME':
                touched.add(gp.oldpath)
        return touched
2215
2215
# Plain Exception subclass that adds no state or behaviour of its own.
# NOTE(review): presumably raised when a change can only be expressed as a
# git-style diff; its raise/catch sites are not in this part of the file
# -- confirm.
class GitDiffRequired(Exception):
    pass
2218
2218
def diffallopts(ui, opts=None, untrusted=False, section='diff'):
    '''return diffopts with all features supported and parsed

    Calls difffeatureopts() with the git, whitespace and formatchanging
    feature groups all enabled; the other arguments are forwarded as is.
    '''
    return difffeatureopts(ui, opts=opts, untrusted=untrusted, section=section,
                           git=True, whitespace=True, formatchanging=True)
2223
2223
2224 diffopts = diffallopts
2224 diffopts = diffallopts
2225
2225
def difffeatureopts(ui, opts=None, untrusted=False, section='diff', git=False,
                    whitespace=False, formatchanging=False):
    '''return diffopts with only opted-in features parsed

    Features:
    - git: git-style diffs
    - whitespace: whitespace options like ignoreblanklines and ignorews
    - formatchanging: options that will likely break or cause correctness issues
      with most diff parsers

    opts, when given, is a mapping of command line values that take
    precedence over the configuration read from section. The result is
    an mdiff.diffopts built from the collected values.
    '''
    def get(key, name=None, getter=ui.configbool, forceplain=None):
        # diffopts flags are either None-default (which is passed through
        # unchanged, so we can identify unset values), or some other falsey
        # default (eg --unified, which defaults to an empty string). Command
        # line values only override the config entries if they appear to
        # have been set, which is any truthy value, True, or False.
        value = opts.get(key) if opts else None
        if value or isinstance(value, bool):
            return value
        if forceplain is not None and ui.plain():
            return forceplain
        return getter(section, name or key, untrusted=untrusted)

    buildopts = {}

    # core options, expected to be understood by every diff parser
    buildopts['nodates'] = get('nodates')
    buildopts['showfunc'] = get('show_function', 'showfunc')
    buildopts['context'] = get('unified', getter=ui.config)
    buildopts['worddiff'] = ui.configbool('experimental', 'worddiff')

    if git:
        buildopts['git'] = get('git')

        # this lives in the experimental section, so ui.configbool has to be
        # called directly instead of going through get()
        buildopts['showsimilarity'] = ui.configbool(
            'experimental', 'extendedheader.similarity')

        # the ui object is inspected directly instead of using get() since
        # the value has to be tested for being an int
        hconf = ui.config('experimental', 'extendedheader.index')
        if hconf is not None:
            hlen = None
            try:
                # the hash config could be an integer (for length of hash)
                # or a word (e.g. short, full, none)
                hlen = int(hconf)
                if not 0 <= hlen <= 40:
                    msg = _("invalid length for extendedheader.index: '%d'\n")
                    ui.warn(msg % hlen)
            except ValueError:
                # not a number: translate the known words, 'none' leaves
                # the length unset, anything else is reported
                wordlengths = {'': 12, 'short': 12, 'full': 40}
                if hconf in wordlengths:
                    hlen = wordlengths[hconf]
                elif hconf != 'none':
                    msg = _("invalid value for extendedheader.index: '%s'\n")
                    ui.warn(msg % hconf)
            finally:
                buildopts['index'] = hlen

    if whitespace:
        buildopts['ignorews'] = get('ignore_all_space', 'ignorews')
        buildopts['ignorewsamount'] = get('ignore_space_change',
                                          'ignorewsamount')
        buildopts['ignoreblanklines'] = get('ignore_blank_lines',
                                            'ignoreblanklines')
        buildopts['ignorewseol'] = get('ignore_space_at_eol', 'ignorewseol')

    if formatchanging:
        buildopts['text'] = opts and opts.get('text')
        binary = None if opts is None else opts.get('binary')
        if binary is not None:
            # an explicit 'binary' value wins over the nobinary setting
            buildopts['nobinary'] = not binary
        else:
            buildopts['nobinary'] = get('nobinary', forceplain=False)
        buildopts['noprefix'] = get('noprefix', forceplain=False)

    return mdiff.diffopts(**pycompat.strkwargs(buildopts))
2307
2307
def diff(repo, node1=None, node2=None, match=None, changes=None,
         opts=None, losedatafn=None, prefix='', relroot='', copy=None,
         hunksfilterfn=None):
    '''yields diff of changes to files between two nodes, or node and
    working directory.

    if node1 is None, use first dirstate parent instead.
    if node2 is None, compare node1 with working directory.

    losedatafn(**kwarg) is a callable run when opts.upgrade=True and
    every time some change cannot be represented with the current
    patch format. Return False to upgrade to git patch format, True to
    accept the loss or raise an exception to abort the diff. It is
    called with the name of current file being diffed as 'fn'. If set
    to None, patches will always be upgraded to git format when
    necessary.

    prefix is a filename prefix that is prepended to all filenames on
    display (used for subrepos).

    relroot, if not empty, must be normalized with a trailing /. Any match
    patterns that fall outside it will be ignored.

    copy, if not empty, should contain mappings {dst@y: src@x} of copy
    information.

    hunksfilterfn, if not None, should be a function taking a filectx and
    hunks generator that may yield filtered hunks.

    For each file, the header lines (joined with newlines) are yielded
    first, followed by the concatenated hunk text. A header is only
    emitted when there is hunk text or the header has more than one line.
    '''
    for fctx1, fctx2, hdr, hunks in diffhunks(
            repo, node1=node1, node2=node2,
            match=match, changes=changes, opts=opts,
            losedatafn=losedatafn, prefix=prefix, relroot=relroot, copy=copy,
    ):
        if hunksfilterfn is not None:
            # If the file has been removed, fctx2 is None; but this should
            # not occur here since we catch removed files early in
            # cmdutil.getloglinerangerevs() for 'hg log -L'.
            assert fctx2 is not None, \
                'fctx2 unexpectly None in diff hunks filtering'
            hunks = hunksfilterfn(fctx2, hunks)
        # flatten the hunks straight into the join; building the line list
        # with sum(..., []) copies the accumulated list once per hunk
        text = ''.join(line for hrange, hlines in hunks for line in hlines)
        if hdr and (text or len(hdr) > 1):
            yield '\n'.join(hdr) + '\n'
        if text:
            yield text
2354
2354
def diffhunks(repo, node1=None, node2=None, match=None, changes=None,
              opts=None, losedatafn=None, prefix='', relroot='', copy=None):
    """Yield diff of changes to files in the form of (`header`, `hunks`) tuples
    where `header` is a list of diff headers and `hunks` is an iterable of
    (`hunkrange`, `hunklines`) tuples.

    See diff() for the meaning of parameters.

    The work is delegated to trydiff(); diff() in this file unpacks every
    produced item as (fctx1, fctx2, header, hunks). An empty list is
    returned when nothing was modified, added or removed.
    """

    if opts is None:
        opts = mdiff.defaultopts

    if not node1 and not node2:
        node1 = repo.dirstate.p1()

    # small cache of filelogs keyed by file name; `recent` tracks usage
    # order so that the least recently used entry gets evicted first
    filelogs = {}
    recent = collections.deque()
    def getfilectx(f, ctx):
        fctx = ctx.filectx(f, filelog=filelogs.get(f))
        if f in filelogs:
            recent.remove(f)
        else:
            if len(filelogs) > 20:
                del filelogs[recent.popleft()]
            filelogs[f] = fctx.filelog()
        recent.append(f)
        return fctx

    ctx1 = repo[node1]
    ctx2 = repo[node2]

    relfiltered = False
    if relroot != '' and match.always():
        # as a special case, create a new matcher with just the relroot
        match = scmutil.match(ctx2, [relroot], default='path')
        relfiltered = True

    if not changes:
        changes = repo.status(ctx1, ctx2, match=match)
    modified, added, removed = changes[:3]

    if not (modified or added or removed):
        return []

    hexfunc = hex if repo.ui.debugflag else short
    revs = [hexfunc(node) for node in [ctx1.node(), ctx2.node()] if node]

    if copy is None:
        copy = {}
        if opts.git or opts.upgrade:
            copy = copies.pathcopies(ctx1, ctx2, match=match)

    if relroot is not None:
        if not relfiltered:
            # XXX this would ideally be done in the matcher, but that is
            # generally meant to 'or' patterns, not 'and' them. In this case
            # we need to 'and' all the patterns from the matcher with relroot.
            modified = [f for f in modified if f.startswith(relroot)]
            added = [f for f in added if f.startswith(relroot)]
            removed = [f for f in removed if f.startswith(relroot)]
        # filter out copies where either side isn't inside the relative root
        copy = dict((dst, src) for dst, src in copy.iteritems()
                    if dst.startswith(relroot) and src.startswith(relroot))

    modifiedset = set(modified)
    addedset = set(added)
    removedset = set(removed)
    for f in modified:
        if f not in ctx1:
            # Fix up added, since merged-in additions appear as
            # modifications during merges
            modifiedset.remove(f)
            addedset.add(f)
    for f in removed:
        if f not in ctx1:
            # Merged-in additions that are then removed are reported as
            # removed. They are not in ctx1, so we don't want to show them
            # in the diff.
            removedset.remove(f)
    modified = sorted(modifiedset)
    added = sorted(addedset)
    removed = sorted(removedset)
    for dst, src in list(copy.items()):
        if src not in ctx1:
            # Files merged in during a merge and then copied/renamed are
            # reported as copies. We want to show them in the diff as
            # additions.
            del copy[dst]

    def difffn(opts, losedata):
        return trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
                       copy, getfilectx, opts, losedata, prefix, relroot)

    if not opts.upgrade or opts.git:
        return difffn(opts, None)

    def losedata(fn):
        # without a callback, or when the callback returns a false value,
        # the diff has to be redone in git format
        if not (losedatafn and losedatafn(fn=fn)):
            raise GitDiffRequired

    try:
        # Buffer the whole output until we are sure it can be generated
        return list(difffn(opts.copy(git=False), losedata))
    except GitDiffRequired:
        return difffn(opts.copy(git=True), None)
2467
2467
def difflabel(func, *args, **kw):
    '''yields 2-tuples of (output, label) based on the output of func()

    func(*args, **kw) must produce chunks of diff text. Every chunk is
    split into lines and each line is labelled according to its prefix:
    header lines use the 'diff.diffline', 'diff.extended', 'diff.file_a'
    and 'diff.file_b' labels, hunk lines use 'diff.hunk', 'diff.deleted'
    and 'diff.inserted'. Lines without a known prefix and the newlines
    between lines carry an empty label. On changed lines tabs are
    labelled 'diff.tab' and trailing whitespace
    'diff.trailingwhitespace'. When kw['opts'].worddiff is set, changed
    lines paired up by _findmatches() are labelled by _inlinediff().
    '''
    opts = kw.get(r'opts')
    inlinecolor = opts.worddiff if opts else False

    headprefixes = [('diff', 'diff.diffline'),
                    ('copy', 'diff.extended'),
                    ('rename', 'diff.extended'),
                    ('old', 'diff.extended'),
                    ('new', 'diff.extended'),
                    ('deleted', 'diff.extended'),
                    ('index', 'diff.extended'),
                    ('similarity', 'diff.extended'),
                    ('---', 'diff.file_a'),
                    ('+++', 'diff.file_b')]
    textprefixes = [('@', 'diff.hunk'),
                    ('-', 'diff.deleted'),
                    ('+', 'diff.inserted')]

    # whether the current line belongs to a file header; this state is
    # carried over from one chunk to the next
    inheader = False
    for chunk in func(*args, **kw):
        lines = chunk.split('\n')
        matches = _findmatches(lines) if inlinecolor else {}
        for i, line in enumerate(lines):
            if i != 0:
                yield ('\n', '')

            # a hunk marker ends the header, any line that cannot be part
            # of a hunk starts one
            if inheader:
                if line.startswith('@'):
                    inheader = False
            elif line and line[0] not in ' +-@\\':
                inheader = True

            # highlight tabs and trailing whitespace, but only in
            # changed lines
            changed = bool(not inheader and line and line[0] in '+-')
            stripline = line.rstrip() if changed else line

            prefixes = headprefixes if inheader else textprefixes
            for prefix, label in prefixes:
                if not stripline.startswith(prefix):
                    continue
                if not changed:
                    yield (stripline, label)
                elif i in matches:
                    # word-level colouring against the paired line
                    for text, textlabel in _inlinediff(
                            lines[i].rstrip(), lines[matches[i]].rstrip(),
                            label):
                        yield (text, textlabel)
                else:
                    for token in tabsplitter.findall(stripline):
                        if token[0] == '\t':
                            yield (token, 'diff.tab')
                        else:
                            yield (token, label)
                break
            else:
                yield (line, '')

            if line != stripline:
                yield (line[len(stripline):], 'diff.trailingwhitespace')
2533
2533
def _findmatches(slist):
    '''Pair deleted lines with similar inserted lines.

    slist is a list of diff lines. For each line starting with '-', the
    lines after the last matched position are scanned for a line starting
    with '+' whose difflib similarity ratio is above 0.7. The scan gives
    up once a '-' line shows up after a '+' line has been seen.

    Returns a dict that maps the index of each paired deletion to the
    index of its insertion, and the other way around.
    '''
    matches = {}
    lastmatch = 0
    for i, line in enumerate(slist):
        if not line.startswith('-'):
            continue
        lastmatch = max(lastmatch, i)
        start = lastmatch + 1
        seeninsert = False
        for k, candidate in enumerate(slist[start:], start):
            if candidate.startswith('+'):
                # potential match
                seeninsert = True
                matcher = difflib.SequenceMatcher(None, line, candidate)
                if matcher.ratio() > 0.7:
                    lastmatch = k
                    matches[i] = k
                    matches[k] = i
                    break
            elif seeninsert and candidate.startswith('-'):
                # too far, no match
                break
    return matches
2560
2560
def _inlinediff(s1, s2, operation):
    '''Perform string diff to highlight specific changes.

    s1 is the line being labelled and s2 the line it is compared with;
    operation is 'diff.deleted' or 'diff.inserted' and s1 must start with
    the matching '-' or '+' sign. Both lines are split with _nonwordre
    and compared with difflib.ndiff().

    Returns a list of (token, label) pairs covering s1. The label is
    operation for unchanged parts (including the leading sign),
    operation + '.highlight' for changed parts and 'diff.tab' for tabs.
    Consecutive parts with the same label are merged into one token.

    Raises error.ProgrammingError for any other operation, or when the
    expected sign is missing.
    '''
    if operation == 'diff.deleted':
        # ndiff() below gets the deleted line first, so swap the arguments
        skipped = '+?'
        s1, s2 = s2, s1
        sign, signed = '-', s2
    else:
        skipped = '-?'
        sign, signed = '+', s1
    if (operation not in ('diff.deleted', 'diff.inserted')
        or not signed.startswith(sign)):
        raise error.ProgrammingError("Case not expected, operation = %s" %
                                     operation)

    # we never want to highlight the leading +-
    label = operation
    token = sign
    s2 = s2[1:]
    s1 = s1[1:]

    buff = []
    for part in difflib.ndiff(_nonwordre.split(s2), _nonwordre.split(s1)):
        # drop the parts of the other line, the '?' hint lines and empty
        # tokens
        if part[0] in skipped or len(part) == 2:
            continue
        text = part[2:]
        if text == '\t':
            partlabel = 'diff.tab'
        elif part[0] == ' ':
            partlabel = operation
        else:
            partlabel = operation + '.highlight'
        if partlabel == label:
            # contiguous token with same label
            token += text
        else:
            buff.append((token, label))
            label = partlabel
            token = text
    buff.append((token, label))

    return buff
2602
2602
def diffui(*args, **kw):
    '''like diff(), but yields 2-tuples of (output, label) for ui.write()

    All arguments are passed through difflabel() to diff().
    '''
    labelled = difflabel(diff, *args, **kw)
    return labelled
2606
2606
def _filepairs(modified, added, removed, copy, opts):
    '''generates tuples (f1, f2, copyop), where f1 is the name of the file
    before and f2 is the name after. For added files, f1 will be None,
    and for removed files, f2 will be None. copyop may be set to None, 'copy'
    or 'rename' (the latter two only if opts.git is set).

    Files are visited in sorted order. The first copy out of a removed
    file is reported as a 'rename', further copies of the same source as
    'copy'. With opts.git set, a removed file whose copy has been
    reported this way produces no tuple of its own.'''
    addedset = set(added)
    removedset = set(removed)
    # copy source -> copy destination
    copyto = {src: dst for dst, src in copy.items()}
    # removed sources already reported as the origin of a rename
    renamed = set()

    for f in sorted(modified + added + removed):
        if f in addedset:
            f1, f2, copyop = None, f, None
            if f in copy and opts.git:
                f1 = copy[f]
                if f1 in removedset and f1 not in renamed:
                    copyop = 'rename'
                    renamed.add(f1)
                else:
                    copyop = 'copy'
        elif f in removedset:
            # have we already reported a copy above?
            if (opts.git and f in copyto and copyto[f] in addedset
                and copy[copyto[f]] == f):
                continue
            f1, f2, copyop = f, None, None
        else:
            f1, f2, copyop = f, f, None
        yield f1, f2, copyop
2639
2639
2640 def trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
2640 def trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
2641 copy, getfilectx, opts, losedatafn, prefix, relroot):
2641 copy, getfilectx, opts, losedatafn, prefix, relroot):
2642 '''given input data, generate a diff and yield it in blocks
2642 '''given input data, generate a diff and yield it in blocks
2643
2643
2644 If generating a diff would lose data like flags or binary data and
2644 If generating a diff would lose data like flags or binary data and
2645 losedatafn is not None, it will be called.
2645 losedatafn is not None, it will be called.
2646
2646
2647 relroot is removed and prefix is added to every path in the diff output.
2647 relroot is removed and prefix is added to every path in the diff output.
2648
2648
2649 If relroot is not empty, this function expects every path in modified,
2649 If relroot is not empty, this function expects every path in modified,
2650 added, removed and copy to start with it.'''
2650 added, removed and copy to start with it.'''
2651
2651
2652 def gitindex(text):
2652 def gitindex(text):
2653 if not text:
2653 if not text:
2654 text = ""
2654 text = ""
2655 l = len(text)
2655 l = len(text)
2656 s = hashlib.sha1('blob %d\0' % l)
2656 s = hashlib.sha1('blob %d\0' % l)
2657 s.update(text)
2657 s.update(text)
2658 return hex(s.digest())
2658 return hex(s.digest())
2659
2659
2660 if opts.noprefix:
2660 if opts.noprefix:
2661 aprefix = bprefix = ''
2661 aprefix = bprefix = ''
2662 else:
2662 else:
2663 aprefix = 'a/'
2663 aprefix = 'a/'
2664 bprefix = 'b/'
2664 bprefix = 'b/'
2665
2665
2666 def diffline(f, revs):
2666 def diffline(f, revs):
2667 revinfo = ' '.join(["-r %s" % rev for rev in revs])
2667 revinfo = ' '.join(["-r %s" % rev for rev in revs])
2668 return 'diff %s %s' % (revinfo, f)
2668 return 'diff %s %s' % (revinfo, f)
2669
2669
2670 def isempty(fctx):
2670 def isempty(fctx):
2671 return fctx is None or fctx.size() == 0
2671 return fctx is None or fctx.size() == 0
2672
2672
2673 date1 = util.datestr(ctx1.date())
2673 date1 = util.datestr(ctx1.date())
2674 date2 = util.datestr(ctx2.date())
2674 date2 = util.datestr(ctx2.date())
2675
2675
2676 gitmode = {'l': '120000', 'x': '100755', '': '100644'}
2676 gitmode = {'l': '120000', 'x': '100755', '': '100644'}
2677
2677
2678 if relroot != '' and (repo.ui.configbool('devel', 'all-warnings')
2678 if relroot != '' and (repo.ui.configbool('devel', 'all-warnings')
2679 or repo.ui.configbool('devel', 'check-relroot')):
2679 or repo.ui.configbool('devel', 'check-relroot')):
2680 for f in modified + added + removed + list(copy) + list(copy.values()):
2680 for f in modified + added + removed + list(copy) + list(copy.values()):
2681 if f is not None and not f.startswith(relroot):
2681 if f is not None and not f.startswith(relroot):
2682 raise AssertionError(
2682 raise AssertionError(
2683 "file %s doesn't start with relroot %s" % (f, relroot))
2683 "file %s doesn't start with relroot %s" % (f, relroot))
2684
2684
2685 for f1, f2, copyop in _filepairs(modified, added, removed, copy, opts):
2685 for f1, f2, copyop in _filepairs(modified, added, removed, copy, opts):
2686 content1 = None
2686 content1 = None
2687 content2 = None
2687 content2 = None
2688 fctx1 = None
2688 fctx1 = None
2689 fctx2 = None
2689 fctx2 = None
2690 flag1 = None
2690 flag1 = None
2691 flag2 = None
2691 flag2 = None
2692 if f1:
2692 if f1:
2693 fctx1 = getfilectx(f1, ctx1)
2693 fctx1 = getfilectx(f1, ctx1)
2694 if opts.git or losedatafn:
2694 if opts.git or losedatafn:
2695 flag1 = ctx1.flags(f1)
2695 flag1 = ctx1.flags(f1)
2696 if f2:
2696 if f2:
2697 fctx2 = getfilectx(f2, ctx2)
2697 fctx2 = getfilectx(f2, ctx2)
2698 if opts.git or losedatafn:
2698 if opts.git or losedatafn:
2699 flag2 = ctx2.flags(f2)
2699 flag2 = ctx2.flags(f2)
2700 # if binary is True, output "summary" or "base85", but not "text diff"
2700 # if binary is True, output "summary" or "base85", but not "text diff"
2701 binary = not opts.text and any(f.isbinary()
2701 if opts.text:
2702 check_binary = True
2703 binary = False
2704 else:
2705 check_binary = any(f.isbinary()
2702 for f in [fctx1, fctx2] if f is not None)
2706 for f in [fctx1, fctx2] if f is not None)
2707 binary = check_binary
2703
2708
2704 if losedatafn and not opts.git:
2709 if losedatafn and not opts.git:
2705 if (binary or
2710 if (binary or
2706 # copy/rename
2711 # copy/rename
2707 f2 in copy or
2712 f2 in copy or
2708 # empty file creation
2713 # empty file creation
2709 (not f1 and isempty(fctx2)) or
2714 (not f1 and isempty(fctx2)) or
2710 # empty file deletion
2715 # empty file deletion
2711 (isempty(fctx1) and not f2) or
2716 (isempty(fctx1) and not f2) or
2712 # create with flags
2717 # create with flags
2713 (not f1 and flag2) or
2718 (not f1 and flag2) or
2714 # change flags
2719 # change flags
2715 (f1 and f2 and flag1 != flag2)):
2720 (f1 and f2 and flag1 != flag2)):
2716 losedatafn(f2 or f1)
2721 losedatafn(f2 or f1)
2717
2722
2718 path1 = f1 or f2
2723 path1 = f1 or f2
2719 path2 = f2 or f1
2724 path2 = f2 or f1
2720 path1 = posixpath.join(prefix, path1[len(relroot):])
2725 path1 = posixpath.join(prefix, path1[len(relroot):])
2721 path2 = posixpath.join(prefix, path2[len(relroot):])
2726 path2 = posixpath.join(prefix, path2[len(relroot):])
2722 header = []
2727 header = []
2723 if opts.git:
2728 if opts.git:
2724 header.append('diff --git %s%s %s%s' %
2729 header.append('diff --git %s%s %s%s' %
2725 (aprefix, path1, bprefix, path2))
2730 (aprefix, path1, bprefix, path2))
2726 if not f1: # added
2731 if not f1: # added
2727 header.append('new file mode %s' % gitmode[flag2])
2732 header.append('new file mode %s' % gitmode[flag2])
2728 elif not f2: # removed
2733 elif not f2: # removed
2729 header.append('deleted file mode %s' % gitmode[flag1])
2734 header.append('deleted file mode %s' % gitmode[flag1])
2730 else: # modified/copied/renamed
2735 else: # modified/copied/renamed
2731 mode1, mode2 = gitmode[flag1], gitmode[flag2]
2736 mode1, mode2 = gitmode[flag1], gitmode[flag2]
2732 if mode1 != mode2:
2737 if mode1 != mode2:
2733 header.append('old mode %s' % mode1)
2738 header.append('old mode %s' % mode1)
2734 header.append('new mode %s' % mode2)
2739 header.append('new mode %s' % mode2)
2735 if copyop is not None:
2740 if copyop is not None:
2736 if opts.showsimilarity:
2741 if opts.showsimilarity:
2737 sim = similar.score(ctx1[path1], ctx2[path2]) * 100
2742 sim = similar.score(ctx1[path1], ctx2[path2]) * 100
2738 header.append('similarity index %d%%' % sim)
2743 header.append('similarity index %d%%' % sim)
2739 header.append('%s from %s' % (copyop, path1))
2744 header.append('%s from %s' % (copyop, path1))
2740 header.append('%s to %s' % (copyop, path2))
2745 header.append('%s to %s' % (copyop, path2))
2741 elif revs and not repo.ui.quiet:
2746 elif revs and not repo.ui.quiet:
2742 header.append(diffline(path1, revs))
2747 header.append(diffline(path1, revs))
2743
2748
2744 # fctx.is | diffopts | what to | is fctx.data()
2749 # fctx.is | diffopts | what to | is fctx.data()
2745 # binary() | text nobinary git index | output? | outputted?
2750 # binary() | text nobinary git index | output? | outputted?
2746 # ------------------------------------|----------------------------
2751 # ------------------------------------|----------------------------
2747 # yes | no no no * | summary | no
2752 # yes | no no no * | summary | no
2748 # yes | no no yes * | base85 | yes
2753 # yes | no no yes * | base85 | yes
2749 # yes | no yes no * | summary | no
2754 # yes | no yes no * | summary | no
2750 # yes | no yes yes 0 | summary | no
2755 # yes | no yes yes 0 | summary | no
2751 # yes | no yes yes >0 | summary | semi [1]
2756 # yes | no yes yes >0 | summary | semi [1]
2752 # yes | yes * * * | text diff | yes
2757 # yes | yes * * * | text diff | yes
2753 # no | * * * * | text diff | yes
2758 # no | * * * * | text diff | yes
2754 # [1]: hash(fctx.data()) is outputted. so fctx.data() cannot be faked
2759 # [1]: hash(fctx.data()) is outputted. so fctx.data() cannot be faked
2755 if binary and (not opts.git or (opts.git and opts.nobinary and not
2760 if binary and (not opts.git or (opts.git and opts.nobinary and not
2756 opts.index)):
2761 opts.index)):
2757 # fast path: no binary content will be displayed, content1 and
2762 # fast path: no binary content will be displayed, content1 and
2758 # content2 are only used for equivalent test. cmp() could have a
2763 # content2 are only used for equivalent test. cmp() could have a
2759 # fast path.
2764 # fast path.
2760 if fctx1 is not None:
2765 if fctx1 is not None:
2761 content1 = b'\0'
2766 content1 = b'\0'
2762 if fctx2 is not None:
2767 if fctx2 is not None:
2763 if fctx1 is not None and not fctx1.cmp(fctx2):
2768 if fctx1 is not None and not fctx1.cmp(fctx2):
2764 content2 = b'\0' # not different
2769 content2 = b'\0' # not different
2765 else:
2770 else:
2766 content2 = b'\0\0'
2771 content2 = b'\0\0'
2767 else:
2772 else:
2768 # normal path: load contents
2773 # normal path: load contents
2769 if fctx1 is not None:
2774 if fctx1 is not None:
2770 content1 = fctx1.data()
2775 content1 = fctx1.data()
2771 if fctx2 is not None:
2776 if fctx2 is not None:
2772 content2 = fctx2.data()
2777 content2 = fctx2.data()
2773
2778
2774 if binary and opts.git and not opts.nobinary:
2779 if binary and opts.git and not opts.nobinary:
2775 text = mdiff.b85diff(content1, content2)
2780 text = mdiff.b85diff(content1, content2)
2776 if text:
2781 if text:
2777 header.append('index %s..%s' %
2782 header.append('index %s..%s' %
2778 (gitindex(content1), gitindex(content2)))
2783 (gitindex(content1), gitindex(content2)))
2779 hunks = (None, [text]),
2784 hunks = (None, [text]),
2780 else:
2785 else:
2781 if opts.git and opts.index > 0:
2786 if opts.git and opts.index > 0:
2782 flag = flag1
2787 flag = flag1
2783 if flag is None:
2788 if flag is None:
2784 flag = flag2
2789 flag = flag2
2785 header.append('index %s..%s %s' %
2790 header.append('index %s..%s %s' %
2786 (gitindex(content1)[0:opts.index],
2791 (gitindex(content1)[0:opts.index],
2787 gitindex(content2)[0:opts.index],
2792 gitindex(content2)[0:opts.index],
2788 gitmode[flag]))
2793 gitmode[flag]))
2789
2794
2790 uheaders, hunks = mdiff.unidiff(content1, date1,
2795 uheaders, hunks = mdiff.unidiff(content1, date1,
2791 content2, date2,
2796 content2, date2,
2792 path1, path2, opts=opts)
2797 path1, path2, opts=opts,
2798 check_binary=check_binary)
2793 header.extend(uheaders)
2799 header.extend(uheaders)
2794 yield fctx1, fctx2, header, hunks
2800 yield fctx1, fctx2, header, hunks
2795
2801
def diffstatsum(stats):
    '''fold per-file diffstat entries into overall totals

    ``stats`` is an iterable of ``(filename, adds, removes, isbinary)``
    tuples, as produced by diffstatdata().

    Returns a 5-tuple ``(maxfile, maxtotal, addtotal, removetotal, binary)``:
    the largest encoding.colwidth() of any filename, the largest per-file
    ``adds + removes``, the sum of all adds, the sum of all removes, and the
    result of or-ing together every entry's binary flag.
    '''
    widest = biggest = totaladds = totalremoves = 0
    anybinary = False
    for name, added, removed, isbin in stats:
        widest = max(widest, encoding.colwidth(name))
        biggest = max(biggest, added + removed)
        totaladds += added
        totalremoves += removed
        anybinary = anybinary or isbin

    return widest, biggest, totaladds, totalremoves, anybinary
2806
2812
def diffstatdata(lines):
    '''collect per-file change counts from the lines of a diff

    ``lines`` is an iterable of diff output lines. Returns a list of
    ``(filename, adds, removes, isbinary)`` tuples, one per file diff found,
    in the order they appear.
    '''
    # raw byte-string literal: keeps '\s' a regex escape instead of an
    # invalid string escape, matching the br'' patterns used by diffstatui()
    diffre = re.compile(br'^diff .*-r [a-z0-9]+\s(.*)$')

    results = []
    filename, adds, removes, isbinary = None, 0, 0, False

    def addresult():
        # flush the counters accumulated for the current file, if any
        if filename:
            results.append((filename, adds, removes, isbinary))

    # inheader is used to track if a line is in the
    # header portion of the diff. This helps properly account
    # for lines that start with '--' or '++'
    inheader = False

    for line in lines:
        if line.startswith('diff'):
            addresult()
            # starting a new file diff
            # set numbers to 0 and reset inheader
            inheader = True
            adds, removes, isbinary = 0, 0, False
            if line.startswith('diff --git a/'):
                filename = gitre.search(line).group(2)
            elif line.startswith('diff -r'):
                # format: "diff -r ... -r ... filename"
                filename = diffre.search(line).group(1)
        elif line.startswith('@@'):
            # first hunk marker ends the header of the current file diff
            inheader = False
        elif line.startswith('+') and not inheader:
            adds += 1
        elif line.startswith('-') and not inheader:
            removes += 1
        elif (line.startswith('GIT binary patch') or
              line.startswith('Binary file')):
            isbinary = True
    # the last file has no following 'diff' line to trigger the flush
    addresult()
    return results
2845
2851
def diffstat(lines, width=80):
    '''render a diffstat summary for the diff given as ``lines``

    One row is produced per file (name, change count or 'Bin', and a
    +/- graph), followed by a totals line when at least one file was found.
    ``width`` is the target output width used to size the graph column.
    Returns the whole summary as a single string.
    '''
    stats = diffstatdata(lines)
    maxname, maxtotal, totaladds, totalremoves, hasbinary = diffstatsum(stats)

    countwidth = len(str(maxtotal))
    if hasbinary:
        # the count column must be able to hold 'Bin'
        countwidth = max(countwidth, 3)
    # never let the graph shrink below 10 columns
    graphwidth = max(width - countwidth - maxname - 6, 10)

    def scale(i):
        if maxtotal > graphwidth:
            # If diffstat runs out of room it doesn't print anything,
            # which isn't very useful, so always print at least one + or -
            # if there were at least some changes.
            return max(i * graphwidth // maxtotal, int(bool(i)))
        return i

    output = []
    for filename, adds, removes, isbinary in stats:
        count = 'Bin' if isbinary else '%d' % (adds + removes)
        padding = ' ' * (maxname - encoding.colwidth(filename))
        output.append(' %s%s | %*s %s%s\n' %
                      (filename, padding, countwidth, count,
                       '+' * scale(adds), '-' * scale(removes)))

    if stats:
        output.append(_(' %d files changed, %d insertions(+), '
                        '%d deletions(-)\n')
                      % (len(stats), totaladds, totalremoves))

    return ''.join(output)
2883
2889
def diffstatui(*args, **kw):
    '''labelled variant of diffstat() for ui.write()

    Takes the same arguments as diffstat() and yields ``(output, label)``
    2-tuples. For a line ending in '+' or '-', the text before the graph is
    yielded unlabelled and the runs of '+' and '-' are yielded with the
    'diffstat.inserted' and 'diffstat.deleted' labels. Any other line is
    yielded whole with an empty label. Every line is followed by an
    unlabelled newline.
    '''
    graphparts = (
        (br'\++', 'diffstat.inserted'),
        (br'-+', 'diffstat.deleted'),
    )

    for line in diffstat(*args, **kw).splitlines():
        hasgraph = bool(line) and line[-1] in '+-'
        if not hasgraph:
            yield (line, '')
        else:
            name, graph = line.rsplit(' ', 1)
            yield (name + ' ', '')
            for pattern, label in graphparts:
                m = re.search(pattern, graph)
                if m:
                    yield (m.group(0), label)
        yield ('\n', '')
General Comments 0
You need to be logged in to leave comments. Login now