##// END OF EJS Templates
patch: do not break up multibyte character when highlighting word...
Yuya Nishihara -
r35384:82c37623 default
parent child Browse files
Show More
@@ -1,2899 +1,2900 b''
1 1 # patch.py - patch file parsing routines
2 2 #
3 3 # Copyright 2006 Brendan Cully <brendan@kublai.com>
4 4 # Copyright 2007 Chris Mason <chris.mason@oracle.com>
5 5 #
6 6 # This software may be used and distributed according to the terms of the
7 7 # GNU General Public License version 2 or any later version.
8 8
9 9 from __future__ import absolute_import, print_function
10 10
11 11 import collections
12 12 import copy
13 13 import difflib
14 14 import email
15 15 import errno
16 16 import hashlib
17 17 import os
18 18 import posixpath
19 19 import re
20 20 import shutil
21 21 import tempfile
22 22 import zlib
23 23
24 24 from .i18n import _
25 25 from .node import (
26 26 hex,
27 27 short,
28 28 )
29 29 from . import (
30 30 copies,
31 31 encoding,
32 32 error,
33 33 mail,
34 34 mdiff,
35 35 pathutil,
36 36 policy,
37 37 pycompat,
38 38 scmutil,
39 39 similar,
40 40 util,
41 41 vfs as vfsmod,
42 42 )
43 43
# hunk-testing helpers, resolved through the module policy
diffhelpers = policy.importmod(r'diffhelpers')
stringio = util.stringio

# "diff --git a/<old> b/<new>" header; groups are the two paths
gitre = re.compile(br'diff --git a/(.*) b/(.*)')
# splits a line into alternating runs of tabs and non-tab text
tabsplitter = re.compile(br'(\t+|[^\t]+)')
# matches one "non-word" byte: anything other than ASCII alphanumerics,
# underscore, or a byte in the 0x80-0xff range (so bytes of a multibyte
# character are never treated as word separators)
_nonwordre = re.compile(br'([^a-zA-Z0-9_\x80-\xff])')

PatchError = error.PatchError
51 52
52 53 # public functions
53 54
def split(stream):
    '''return an iterator of individual patches from a stream

    The first lines of ``stream`` are inspected to decide how the input
    is delimited ("# HG changeset patch" markers, mbox "From " lines, a
    MIME message, or plain RFC-822 style headers). The matching splitter
    generator is returned; each item it yields is a stringio holding one
    chunk. If no format is recognized, the whole input is yielded as a
    single chunk.
    '''
    def isheader(line, inheader):
        # True when ``line`` looks like a "Name: value" header line, or
        # like a continuation of one (leading whitespace while already
        # inside a header block).
        if inheader and line[0] in (' ', '\t'):
            # continuation
            return True
        if line[0] in (' ', '-', '+'):
            # diff line - don't check for header pattern in there
            return False
        l = line.split(': ', 1)
        return len(l) == 2 and ' ' not in l[0]

    def chunk(lines):
        # wrap the accumulated lines in a file-like object
        return stringio(''.join(lines))

    def hgsplit(stream, cur):
        # ``cur`` already holds the lines consumed by the sniffing loop
        inheader = True

        for line in stream:
            if not line.strip():
                # a blank line ends the header block
                inheader = False
            if not inheader and line.startswith('# HG changeset patch'):
                # a new export marker outside a header starts a new patch
                yield chunk(cur)
                cur = []
                inheader = True

            cur.append(line)

        if cur:
            yield chunk(cur)

    def mboxsplit(stream, cur):
        for line in stream:
            if line.startswith('From '):
                # cur[0] is the "From " separator line itself; drop it and
                # recursively split the message that followed it
                for c in split(chunk(cur[1:])):
                    yield c
                cur = []

            cur.append(line)

        if cur:
            for c in split(chunk(cur[1:])):
                yield c

    def mimesplit(stream, cur):
        def msgfp(m):
            # serialize a message (or message part) back into a stringio
            fp = stringio()
            g = email.Generator.Generator(fp, mangle_from_=False)
            g.flatten(m)
            fp.seek(0)
            return fp

        # the email parser needs the complete input, so drain the stream
        for line in stream:
            cur.append(line)
        c = chunk(cur)

        m = email.Parser.Parser().parse(c)
        if not m.is_multipart():
            yield msgfp(m)
        else:
            # only textual parts can carry a patch
            ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
            for part in m.walk():
                ct = part.get_content_type()
                if ct not in ok_types:
                    continue
                yield msgfp(part)

    def headersplit(stream, cur):
        inheader = False

        for line in stream:
            if not inheader and isheader(line, inheader):
                # first header line after body text: a new patch begins
                yield chunk(cur)
                cur = []
                inheader = True
            if inheader and not isheader(line, inheader):
                inheader = False

            cur.append(line)

        if cur:
            yield chunk(cur)

    def remainder(cur):
        yield chunk(cur)

    class fiter(object):
        # adapts an object that only offers readline() to the iterator
        # protocol (both the Python 2 and Python 3 spellings)
        def __init__(self, fp):
            self.fp = fp

        def __iter__(self):
            return self

        def next(self):
            l = self.fp.readline()
            if not l:
                raise StopIteration
            return l

        __next__ = next

    inheader = False
    cur = []

    mimeheaders = ['content-type']

    if not util.safehasattr(stream, 'next'):
        # http responses, for example, have readline but not next
        stream = fiter(stream)

    # Sniff the input line by line; the chosen splitter receives the same
    # (partially consumed) iterator plus the lines read so far.
    for line in stream:
        cur.append(line)
        if line.startswith('# HG changeset patch'):
            return hgsplit(stream, cur)
        elif line.startswith('From '):
            return mboxsplit(stream, cur)
        elif isheader(line, inheader):
            inheader = True
            if line.split(':', 1)[0].lower() in mimeheaders:
                # let email parser handle this
                return mimesplit(stream, cur)
        elif line.startswith('--- ') and inheader:
            # No evil headers seen by diff start, split by hand
            return headersplit(stream, cur)
        # Not enough info, keep reading

    # if we are here, we have a very plain patch
    return remainder(cur)
182 183
## Some facility for extensible patch parsing:
# list of pairs ("header to match", "data key")
# extract() looks for "# <header> <value>" lines in the "# HG changeset
# patch" header block and stores <value> under the paired data key.
patchheadermap = [('Date', 'date'),
                  ('Branch', 'branch'),
                  ('Node ID', 'nodeid'),
                  ]
189 190
def extract(ui, fileobj):
    '''extract patch from data read from fileobj.

    patch can be a normal patch or contained in an email message.

    return a dictionary. Standard keys are:
      - filename,
      - message,
      - user,
      - date,
      - branch,
      - nodeid,
      - p1,
      - p2.
    Any item can be missing from the dictionary. If filename is missing,
    fileobj did not contain a patch. Caller must unlink filename when done.

    The patch payload is copied to a temporary file (prefix 'hg-patch-');
    that file is removed here when no diff was found or when an exception
    propagates.'''

    # attempt to detect the start of a patch
    # (this heuristic is borrowed from quilt)
    diffre = re.compile(br'^(?:Index:[ \t]|diff[ \t]-|RCS file: |'
                        br'retrieving revision [0-9]+(\.[0-9]+)*$|'
                        br'---[ \t].*?^\+\+\+[ \t]|'
                        br'\*\*\*[ \t].*?^---[ \t])',
                        re.MULTILINE | re.DOTALL)

    data = {}
    fd, tmpname = tempfile.mkstemp(prefix='hg-patch-')
    tmpfp = os.fdopen(fd, pycompat.sysstr('w'))
    try:
        msg = email.Parser.Parser().parse(fileobj)

        subject = msg['Subject'] and mail.headdecode(msg['Subject'])
        data['user'] = msg['From'] and mail.headdecode(msg['From'])
        if not subject and not data['user']:
            # Not an email, restore parsed headers if any
            subject = '\n'.join(': '.join(h) for h in msg.items()) + '\n'

        # should try to parse msg['Date']
        parents = []

        if subject:
            # strip a leading "[PATCH ...]" tag
            if subject.startswith('[PATCH'):
                pend = subject.find(']')
                if pend >= 0:
                    subject = subject[pend + 1:].lstrip()
            # unfold continuation lines into a single line
            subject = re.sub(br'\n[ \t]+', ' ', subject)
            ui.debug('Subject: %s\n' % subject)
        if data['user']:
            ui.debug('From: %s\n' % data['user'])
        diffs_seen = 0
        ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
        message = ''
        for part in msg.walk():
            content_type = part.get_content_type()
            ui.debug('Content-Type: %s\n' % content_type)
            if content_type not in ok_types:
                continue
            payload = part.get_payload(decode=True)
            m = diffre.search(payload)
            if m:
                hgpatch = False        # saw a "# HG changeset patch" marker
                hgpatchheader = False  # currently inside its "# ..." block
                ignoretext = False     # saw a bare "---" line

                ui.debug('found patch at byte %d\n' % m.start(0))
                diffs_seen += 1
                cfp = stringio()
                # everything before the diff is commit message / metadata
                for line in payload[:m.start(0)].splitlines():
                    if line.startswith('# HG changeset patch') and not hgpatch:
                        ui.debug('patch generated by hg export\n')
                        hgpatch = True
                        hgpatchheader = True
                        # drop earlier commit message content
                        cfp.seek(0)
                        cfp.truncate()
                        subject = None
                    elif hgpatchheader:
                        if line.startswith('# User '):
                            data['user'] = line[7:]
                            ui.debug('From: %s\n' % data['user'])
                        elif line.startswith("# Parent "):
                            parents.append(line[9:].lstrip())
                        elif line.startswith("# "):
                            for header, key in patchheadermap:
                                prefix = '# %s ' % header
                                if line.startswith(prefix):
                                    data[key] = line[len(prefix):]
                        else:
                            # first non-"# " line ends the header block
                            hgpatchheader = False
                    elif line == '---':
                        ignoretext = True
                    if not hgpatchheader and not ignoretext:
                        cfp.write(line)
                        cfp.write('\n')
                message = cfp.getvalue()
                if tmpfp:
                    tmpfp.write(payload)
                    if not payload.endswith('\n'):
                        tmpfp.write('\n')
            elif not diffs_seen and message and content_type == 'text/plain':
                # plain-text part before any diff extends the message
                message += '\n' + payload
    except: # re-raises
        # do not leave the temporary file behind on failure
        tmpfp.close()
        os.unlink(tmpname)
        raise

    if subject and not message.startswith(subject):
        message = '%s\n%s' % (subject, message)
    data['message'] = message
    tmpfp.close()
    if parents:
        data['p1'] = parents.pop(0)
        if parents:
            data['p2'] = parents.pop(0)

    if diffs_seen:
        data['filename'] = tmpname
    else:
        os.unlink(tmpname)
    return data
310 311
class patchmeta(object):
    """Metadata describing one file touched by a patch.

    'op' names the operation: ADD, DELETE, RENAME, MODIFY or COPY.
    'path' is the patched file. 'oldpath' is the origin file for COPY
    and RENAME and None for everything else. 'mode' stays None unless the
    file mode changes, in which case it is an (islink, isexec) pair whose
    members are truthy for a symlink / an executable file respectively.
    'binary' tells whether the patch carries binary data for the file.
    """
    def __init__(self, path):
        self.path = path
        self.oldpath = None
        self.mode = None
        self.op = 'MODIFY'
        self.binary = False

    def setmode(self, mode):
        # keep the raw masked bits: symlink bit first, owner-exec bit second
        self.mode = (mode & 0o20000, mode & 0o100)

    def copy(self):
        """Return a new patchmeta carrying the same field values."""
        duplicate = patchmeta(self.path)
        for field in ('oldpath', 'mode', 'op', 'binary'):
            setattr(duplicate, field, getattr(self, field))
        return duplicate

    def _ispatchinga(self, afile):
        # the "a/" side is /dev/null only when the file is being added
        if afile != '/dev/null':
            source = self.oldpath or self.path
            return afile == 'a/' + source
        return self.op == 'ADD'

    def _ispatchingb(self, bfile):
        # the "b/" side is /dev/null only when the file is being deleted
        if bfile != '/dev/null':
            return bfile == 'b/' + self.path
        return self.op == 'DELETE'

    def ispatching(self, afile, bfile):
        """Tell whether the (afile, bfile) header pair refers to this file."""
        if not self._ispatchinga(afile):
            return False
        return self._ispatchingb(bfile)

    def __repr__(self):
        return "<patchmeta %s %r>" % (self.op, self.path)
356 357
def readgitpatch(lr):
    """Collect git-style metadata from the patch lines produced by ``lr``.

    Returns a list of patchmeta objects, one per "diff --git" header, in
    the order the headers were encountered.
    """
    collected = []
    current = None
    for raw in lr:
        text = raw.rstrip(' \r\n')
        if text.startswith('diff --git a/'):
            found = gitre.match(text)
            if found:
                # a new file header closes the previous entry, if any
                if current:
                    collected.append(current)
                current = patchmeta(found.group(2))
            continue
        if not current:
            # extended header lines only matter after a "diff --git" line
            continue
        if text.startswith('--- '):
            # start of the actual diff: metadata for this file is complete
            collected.append(current)
            current = None
        elif text.startswith('rename from '):
            current.op = 'RENAME'
            current.oldpath = text[12:]
        elif text.startswith('rename to '):
            current.path = text[10:]
        elif text.startswith('copy from '):
            current.op = 'COPY'
            current.oldpath = text[10:]
        elif text.startswith('copy to '):
            current.path = text[8:]
        elif text.startswith('deleted file'):
            current.op = 'DELETE'
        elif text.startswith('new file mode '):
            current.op = 'ADD'
            # the mode is the trailing six octal digits
            current.setmode(int(text[-6:], 8))
        elif text.startswith('new mode '):
            current.setmode(int(text[-6:], 8))
        elif text.startswith('GIT binary patch'):
            current.binary = True
    if current:
        collected.append(current)

    return collected
400 401
class linereader(object):
    # thin wrapper around a file object that lets callers push lines back
    # so that they are returned again by later readline() calls
    def __init__(self, fp):
        self.fp = fp
        self.buf = []

    def push(self, line):
        # None is silently ignored so callers can push unconditionally
        if line is None:
            return
        self.buf.append(line)

    def readline(self):
        # pushed-back lines are served first, oldest first
        if not self.buf:
            return self.fp.readline()
        return self.buf.pop(0)

    def __iter__(self):
        # iterate until readline() returns the empty string
        return iter(self.readline, '')
420 421
class abstractbackend(object):
    """Interface of the storage a patch is applied to.

    Every method except writerej() raises NotImplementedError here;
    writerej() is a no-op in this base class.
    """
    def __init__(self, ui):
        self.ui = ui

    def getfile(self, fname):
        """Return target file data and flags as a (data, (islink,
        isexec)) tuple. Data is None if file is missing/deleted.
        """
        raise NotImplementedError

    def setfile(self, fname, data, mode, copysource):
        """Write data to target file fname and set its mode. mode is a
        (islink, isexec) tuple. If data is None, the file content should
        be left unchanged. If the file is modified after being copied,
        copysource is set to the original file name.
        """
        raise NotImplementedError

    def unlink(self, fname):
        """Unlink target file."""
        raise NotImplementedError

    def writerej(self, fname, failed, total, lines):
        """Write rejected lines for fname. failed is the number of hunks
        which failed to apply and total the total number of hunks for this
        file.
        """

    def exists(self, fname):
        """Tell whether target file fname exists."""
        raise NotImplementedError

    def close(self):
        """Finish the patching session."""
        raise NotImplementedError
454 455
class fsbackend(abstractbackend):
    """Backend operating on plain files below ``basedir`` through a vfs."""

    def __init__(self, ui, basedir):
        super(fsbackend, self).__init__(ui)
        self.opener = vfsmod.vfs(basedir)

    def getfile(self, fname):
        """Return (data, (islink, isexec)) for fname, or (None, None) when
        the file cannot be read because it does not exist."""
        vfs = self.opener
        if vfs.islink(fname):
            # for a symlink the "data" is the link target
            return (vfs.readlink(fname), (True, False))

        try:
            executable = vfs.lstat(fname).st_mode & 0o100 != 0
        except OSError as err:
            if err.errno != errno.ENOENT:
                raise
            executable = False

        try:
            content = vfs.read(fname)
        except IOError as err:
            if err.errno != errno.ENOENT:
                raise
            return None, None
        return (content, (False, executable))

    def setfile(self, fname, data, mode, copysource):
        """Write data to fname honouring the (islink, isexec) mode; with
        data None only the flags are updated."""
        link, executable = mode
        if data is None:
            self.opener.setflags(fname, link, executable)
        elif link:
            self.opener.symlink(data, fname)
        else:
            self.opener.write(fname, data)
            if executable:
                self.opener.setflags(fname, False, True)

    def unlink(self, fname):
        self.opener.unlinkpath(fname, ignoremissing=True)

    def writerej(self, fname, failed, total, lines):
        """Warn about the failed hunks and save them to '<fname>.rej'."""
        rejname = fname + ".rej"
        self.ui.warn(
            _("%d out of %d hunks FAILED -- saving rejects to file %s\n") %
            (failed, total, rejname))
        out = self.opener(rejname, 'w')
        out.writelines(lines)
        out.close()

    def exists(self, fname):
        return self.opener.lexists(fname)
503 504
class workingbackend(fsbackend):
    """Filesystem backend rooted at repo.root that also records which
    files were changed, removed or copied, and reports them to the
    repository when closed."""

    def __init__(self, ui, repo, similarity):
        super(workingbackend, self).__init__(ui, repo.root)
        self.repo = repo
        self.similarity = similarity
        self.removed = set()
        self.changed = set()
        self.copied = []

    def _checkknown(self, fname):
        # refuse to touch a file that exists on disk but is unknown ('?')
        # to the dirstate
        untracked = self.repo.dirstate[fname] == '?'
        if untracked and self.exists(fname):
            raise PatchError(_('cannot patch %s: file is not tracked') % fname)

    def setfile(self, fname, data, mode, copysource):
        self._checkknown(fname)
        super(workingbackend, self).setfile(fname, data, mode, copysource)
        if copysource is not None:
            self.copied.append((copysource, fname))
        self.changed.add(fname)

    def unlink(self, fname):
        self._checkknown(fname)
        super(workingbackend, self).unlink(fname)
        self.removed.add(fname)
        self.changed.add(fname)

    def close(self):
        """Record copies, forget removed files, mark the remaining files
        as touched and return the sorted list of all changed files."""
        wctx = self.repo[None]
        touched = set(self.changed)
        for origin, target in self.copied:
            scmutil.dirstatecopy(self.ui, self.repo, wctx, origin, target)
        if self.removed:
            wctx.forget(sorted(self.removed))
            # A removed file that no longer belongs to the dirstate was
            # probably marked added then deleted, and should not be
            # considered by marktouched().
            touched -= set(name for name in self.removed
                           if name not in self.repo.dirstate)
        if touched:
            scmutil.marktouched(self.repo, touched, self.similarity)
        return sorted(self.changed)
547 548
class filestore(object):
    """Store of (data, mode, copied) entries keyed by file name.

    Entries are kept in memory while the accumulated size stays within
    ``maxsize`` bytes (4 MiB when not given; a negative value disables the
    limit). Anything beyond that is written to a temporary directory.
    """

    def __init__(self, maxsize=None):
        self.opener = None
        self.files = {}
        self.created = 0
        self.maxsize = 4*(2**20) if maxsize is None else maxsize
        self.size = 0
        self.data = {}

    def setfile(self, fname, data, mode, copied=None):
        nbytes = len(data)
        fits = self.maxsize < 0 or (nbytes + self.size) <= self.maxsize
        if fits:
            self.data[fname] = (data, mode, copied)
            self.size += nbytes
            return
        # over budget: spill to disk, creating the directory on first use
        if self.opener is None:
            self.opener = vfsmod.vfs(tempfile.mkdtemp(prefix='hg-patch-'))
        # Avoid filename issues with these simple names
        spillname = str(self.created)
        self.opener.write(spillname, data)
        self.created += 1
        self.files[fname] = (spillname, mode, copied)

    def getfile(self, fname):
        """Return the (data, mode, copied) entry for fname, or
        (None, None, None) when fname was never stored."""
        inmemory = self.data.get(fname)
        if inmemory is not None:
            return inmemory
        if self.opener and fname in self.files:
            spillname, mode, copied = self.files[fname]
            return self.opener.read(spillname), mode, copied
        return None, None, None

    def close(self):
        # remove the spill directory if one was ever created
        if self.opener:
            shutil.rmtree(self.opener.base)
584 585
class repobackend(abstractbackend):
    """Backend reading files from a changectx and writing results into a
    store instead of the filesystem."""

    def __init__(self, ui, repo, ctx, store):
        super(repobackend, self).__init__(ui)
        self.repo = repo
        self.ctx = ctx
        self.store = store
        self.changed = set()
        self.removed = set()
        self.copied = {}

    def _checkknown(self, fname):
        # only files present in the context may be patched
        if fname in self.ctx:
            return
        raise PatchError(_('cannot patch %s: file is not tracked') % fname)

    def getfile(self, fname):
        """Return (data, (islink, isexec)) from the context, or
        (None, None) when the lookup of fname fails."""
        try:
            fctx = self.ctx[fname]
        except error.LookupError:
            return None, None
        flags = fctx.flags()
        content = fctx.data()
        return content, ('l' in flags, 'x' in flags)

    def setfile(self, fname, data, mode, copysource):
        if copysource:
            self._checkknown(copysource)
        if data is None:
            # content unchanged: carry over what the context has
            data = self.ctx[fname].data()
        self.store.setfile(fname, data, mode, copysource)
        self.changed.add(fname)
        if copysource:
            self.copied[fname] = copysource

    def unlink(self, fname):
        self._checkknown(fname)
        self.removed.add(fname)

    def exists(self, fname):
        return fname in self.ctx

    def close(self):
        """Return the set of every file name that was changed or removed."""
        return self.changed.union(self.removed)
626 627
# Hunk range descriptors. These are raw bytes literals (like gitre and
# tabsplitter) so that regex escapes such as \d, \+ and \* reach the regex
# engine untouched instead of being invalid string escape sequences.
# @@ -start,len +start,len @@ or @@ -start +start @@ if len is 1
unidesc = re.compile(br'@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@')
# context diff ranges: "*** start,end ***" or "--- start,end ---"
contextdesc = re.compile(br'(?:---|\*\*\*) (\d+)(?:,(\d+))? (?:---|\*\*\*)')
# accepted values for the end-of-line handling mode
eolmodes = ['strict', 'crlf', 'lf', 'auto']
631 632
class patchfile(object):
    """State for applying the hunks of one patched file.

    The current content is loaded as a list of lines, hunks are applied to
    that list through apply(), and close() writes the result (and any
    rejected hunks) through the backend.
    """
    def __init__(self, ui, gp, backend, store, eolmode='strict'):
        # gp is the patchmeta-like object for the file: path, oldpath,
        # mode and op are read from it.
        self.fname = gp.path
        self.eolmode = eolmode
        self.eol = None
        self.backend = backend
        self.ui = ui
        self.lines = []
        self.exists = False
        self.missing = True
        self.mode = gp.mode
        self.copysource = gp.oldpath
        self.create = gp.op in ('ADD', 'COPY', 'RENAME')
        self.remove = gp.op == 'DELETE'
        if self.copysource is None:
            data, mode = backend.getfile(self.fname)
        else:
            # copies/renames start from the source content kept in store
            data, mode = store.getfile(self.copysource)[:2]
        if data is not None:
            self.exists = self.copysource is None or backend.exists(self.fname)
            self.missing = False
            if data:
                self.lines = mdiff.splitnewlines(data)
            if self.mode is None:
                self.mode = mode
            if self.lines:
                # Normalize line endings
                # (the EOL style is detected from the first line only)
                if self.lines[0].endswith('\r\n'):
                    self.eol = '\r\n'
                elif self.lines[0].endswith('\n'):
                    self.eol = '\n'
                if eolmode != 'strict':
                    nlines = []
                    for l in self.lines:
                        if l.endswith('\r\n'):
                            l = l[:-2] + '\n'
                        nlines.append(l)
                    self.lines = nlines
        else:
            if self.create:
                self.missing = False
            if self.mode is None:
                self.mode = (False, False)
        if self.missing:
            self.ui.warn(_("unable to find '%s' for patching\n") % self.fname)
            self.ui.warn(_("(use '--prefix' to apply patch relative to the "
                           "current directory)\n"))

        self.hash = {}      # line content -> list of indexes in self.lines
        self.dirty = 0      # becomes True once self.lines was modified
        self.offset = 0     # net line count change from applied hunks
        self.skew = 0       # displacement found for the last fuzzy match
        self.rej = []       # hunks that could not be applied
        self.fileprinted = False
        self.printfile(False)
        self.hunks = 0      # number of hunks passed to apply()

    def writelines(self, fname, lines, mode):
        """Write lines to fname through the backend, converting a trailing
        newline of each line to the EOL implied by self.eolmode."""
        if self.eolmode == 'auto':
            eol = self.eol
        elif self.eolmode == 'crlf':
            eol = '\r\n'
        else:
            eol = '\n'

        # lines end with '\n' here, so only a non-'\n' target needs work
        if self.eolmode != 'strict' and eol and eol != '\n':
            rawlines = []
            for l in lines:
                if l and l[-1] == '\n':
                    l = l[:-1] + eol
                rawlines.append(l)
            lines = rawlines

        self.backend.setfile(fname, ''.join(lines), mode, self.copysource)

    def printfile(self, warn):
        """Emit the "patching file" message: as a warning when warn is
        true, as a note otherwise. Once it was shown as a warning or in
        verbose mode it is not emitted again."""
        if self.fileprinted:
            return
        if warn or self.ui.verbose:
            self.fileprinted = True
        s = _("patching file %s\n") % self.fname
        if warn:
            self.ui.warn(s)
        else:
            self.ui.note(s)


    def findlines(self, l, linenum):
        # looks through the hash and finds candidate lines.  The
        # result is a list of line numbers sorted based on distance
        # from linenum
        # (the list stored in self.hash is sorted in place)

        cand = self.hash.get(l, [])
        if len(cand) > 1:
            # resort our list of potentials forward then back.
            cand.sort(key=lambda x: abs(x - linenum))
        return cand

    def write_rej(self):
        # our rejects are a little different from patch(1).  This always
        # creates rejects in the same form as the original patch.  A file
        # header is inserted so that you can run the reject through patch again
        # without having to type the filename.
        if not self.rej:
            return
        base = os.path.basename(self.fname)
        lines = ["--- %s\n+++ %s\n" % (base, base)]
        for x in self.rej:
            for l in x.hunk:
                lines.append(l)
                # a hunk line without trailing newline gets the marker
                if l[-1:] != '\n':
                    lines.append("\n\ No newline at end of file\n")
        self.backend.writerej(self.fname, len(self.rej), self.hunks, lines)

    def apply(self, h):
        """Apply hunk h to the in-memory lines.

        Returns 0 when the hunk applied at its expected position, the fuzz
        length used when it applied elsewhere or with fuzz, and -1 when it
        was rejected (the hunk is then recorded in self.rej). Raises
        PatchError when the hunk is incomplete.
        """
        if not h.complete():
            raise PatchError(_("bad hunk #%d %s (%d %d %d %d)") %
                            (h.number, h.desc, len(h.a), h.lena, len(h.b),
                            h.lenb))

        self.hunks += 1

        if self.missing:
            self.rej.append(h)
            return -1

        if self.exists and self.create:
            if self.copysource:
                self.ui.warn(_("cannot create %s: destination already "
                               "exists\n") % self.fname)
            else:
                self.ui.warn(_("file %s already exists\n") % self.fname)
            self.rej.append(h)
            return -1

        if isinstance(h, binhunk):
            # binary hunks replace the whole content
            if self.remove:
                self.backend.unlink(self.fname)
            else:
                l = h.new(self.lines)
                self.lines[:] = l
                self.offset += len(l)
                self.dirty = True
            return 0

        # keep the unnormalized hunk so rejects match the original patch
        horig = h
        if (self.eolmode in ('crlf', 'lf')
            or self.eolmode == 'auto' and self.eol):
            # If new eols are going to be normalized, then normalize
            # hunk data before patching. Otherwise, preserve input
            # line-endings.
            h = h.getnormalized()

        # fast case first, no offsets, no fuzz
        old, oldstart, new, newstart = h.fuzzit(0, False)
        oldstart += self.offset
        orig_start = oldstart
        # if there's skew we want to emit the "(offset %d lines)" even
        # when the hunk cleanly applies at start + skew, so skip the
        # fast case code
        if (self.skew == 0 and
            diffhelpers.testhunk(old, self.lines, oldstart) == 0):
            if self.remove:
                self.backend.unlink(self.fname)
            else:
                self.lines[oldstart:oldstart + len(old)] = new
                self.offset += len(new) - len(old)
                self.dirty = True
            return 0

        # ok, we couldn't match the hunk. Lets look for offsets and fuzz it
        # (rebuild the content -> line indexes map used by findlines)
        self.hash = {}
        for x, s in enumerate(self.lines):
            self.hash.setdefault(s, []).append(x)

        # try increasing amounts of fuzz, each first trimming context from
        # the top only, then from both ends
        for fuzzlen in xrange(self.ui.configint("patch", "fuzz") + 1):
            for toponly in [True, False]:
                old, oldstart, new, newstart = h.fuzzit(fuzzlen, toponly)
                oldstart = oldstart + self.offset + self.skew
                oldstart = min(oldstart, len(self.lines))
                if old:
                    # candidates are lines equal to the first old line
                    # (without its leading marker character)
                    cand = self.findlines(old[0][1:], oldstart)
                else:
                    # Only adding lines with no or fuzzed context, just
                    # take the skew in account
                    cand = [oldstart]

                for l in cand:
                    if not old or diffhelpers.testhunk(old, self.lines, l) == 0:
                        self.lines[l : l + len(old)] = new
                        self.offset += len(new) - len(old)
                        self.skew = l - orig_start
                        self.dirty = True
                        offset = l - orig_start - fuzzlen
                        if fuzzlen:
                            msg = _("Hunk #%d succeeded at %d "
                                    "with fuzz %d "
                                    "(offset %d lines).\n")
                            self.printfile(True)
                            self.ui.warn(msg %
                                (h.number, l + 1, fuzzlen, offset))
                        else:
                            msg = _("Hunk #%d succeeded at %d "
                                    "(offset %d lines).\n")
                            self.ui.note(msg % (h.number, l + 1, offset))
                        return fuzzlen
        self.printfile(True)
        self.ui.warn(_("Hunk #%d FAILED at %d\n") % (h.number, orig_start))
        self.rej.append(horig)
        return -1

    def close(self):
        """Write the patched content if it changed, write the rejects and
        return the number of rejected hunks."""
        if self.dirty:
            self.writelines(self.fname, self.lines, self.mode)
        self.write_rej()
        return len(self.rej)
848 849
class header(object):
    """The header lines of one file's diff, plus the hunks attached to it.
    """
    diffgit_re = re.compile('diff --git a/(.*) b/(.*)$')
    diff_re = re.compile('diff -r .* (.*)$')
    allhunks_re = re.compile('(?:index|deleted file) ')
    pretty_re = re.compile('(?:new file|deleted file) ')
    special_re = re.compile('(?:index|deleted|copy|rename) ')
    newfile_re = re.compile('(?:new file)')

    def __init__(self, header):
        self.header = header
        self.hunks = []

    def binary(self):
        # an "index " line is what marks the file as binary here
        for line in self.header:
            if line.startswith('index '):
                return True
        return False

    def pretty(self, fp):
        """Write a condensed, human-oriented version of the header to fp."""
        for line in self.header:
            if line.startswith('index '):
                fp.write(_('this modifies a binary file (all or nothing)\n'))
                return
            if self.pretty_re.match(line):
                fp.write(line)
                if self.binary():
                    fp.write(_('this is a binary file\n'))
                return
            if line.startswith('---'):
                # summarize the hunks instead of printing the file lines
                fp.write(_('%d hunks, %d lines changed\n') %
                         (len(self.hunks),
                          sum(max(hk.added, hk.removed)
                              for hk in self.hunks)))
                return
            fp.write(line)

    def write(self, fp):
        fp.write(''.join(self.header))

    def allhunks(self):
        for line in self.header:
            if self.allhunks_re.match(line):
                return True
        return False

    def files(self):
        """Return the file names found on the first header line."""
        first = self.header[0]
        gitmatch = self.diffgit_re.match(first)
        if not gitmatch:
            return self.diff_re.match(first).groups()
        source, target = gitmatch.groups()
        return [source] if source == target else [source, target]

    def filename(self):
        # the last name is the destination file
        return self.files()[-1]

    def __repr__(self):
        names = [repr(name) for name in self.files()]
        return '<header %s>' % (' '.join(names))

    def isnewfile(self):
        for line in self.header:
            if self.newfile_re.match(line):
                return True
        return False

    def special(self):
        # Special files are only selectable as a whole at the header level,
        # never hunk by hunk: a deleted file, for example, is either taken
        # or left entirely. A newly added file is special only while it is
        # empty (two header lines); once it has content its hunks can be
        # picked individually.
        if self.isnewfile() and len(self.header) == 2:
            return True
        for line in self.header:
            if self.special_re.match(line):
                return True
        return False
920 921
921 922 class recordhunk(object):
922 923 """patch hunk
923 924
924 925 XXX shouldn't we merge this with the other hunk class?
925 926 """
926 927
927 928 def __init__(self, header, fromline, toline, proc, before, hunk, after,
928 929 maxcontext=None):
929 930 def trimcontext(lines, reverse=False):
930 931 if maxcontext is not None:
931 932 delta = len(lines) - maxcontext
932 933 if delta > 0:
933 934 if reverse:
934 935 return delta, lines[delta:]
935 936 else:
936 937 return delta, lines[:maxcontext]
937 938 return 0, lines
938 939
939 940 self.header = header
940 941 trimedbefore, self.before = trimcontext(before, True)
941 942 self.fromline = fromline + trimedbefore
942 943 self.toline = toline + trimedbefore
943 944 _trimedafter, self.after = trimcontext(after, False)
944 945 self.proc = proc
945 946 self.hunk = hunk
946 947 self.added, self.removed = self.countchanges(self.hunk)
947 948
948 949 def __eq__(self, v):
949 950 if not isinstance(v, recordhunk):
950 951 return False
951 952
952 953 return ((v.hunk == self.hunk) and
953 954 (v.proc == self.proc) and
954 955 (self.fromline == v.fromline) and
955 956 (self.header.files() == v.header.files()))
956 957
957 958 def __hash__(self):
958 959 return hash((tuple(self.hunk),
959 960 tuple(self.header.files()),
960 961 self.fromline,
961 962 self.proc))
962 963
963 964 def countchanges(self, hunk):
964 965 """hunk -> (n+,n-)"""
965 966 add = len([h for h in hunk if h.startswith('+')])
966 967 rem = len([h for h in hunk if h.startswith('-')])
967 968 return add, rem
968 969
969 970 def reversehunk(self):
970 971 """return another recordhunk which is the reverse of the hunk
971 972
972 973 If this hunk is diff(A, B), the returned hunk is diff(B, A). To do
973 974 that, swap fromline/toline and +/- signs while keep other things
974 975 unchanged.
975 976 """
976 977 m = {'+': '-', '-': '+', '\\': '\\'}
977 978 hunk = ['%s%s' % (m[l[0:1]], l[1:]) for l in self.hunk]
978 979 return recordhunk(self.header, self.toline, self.fromline, self.proc,
979 980 self.before, hunk, self.after)
980 981
def write(self, fp):
    """Write this hunk to ``fp`` as a unified-diff hunk.

    Emits the ``@@ -from,len +to,len @@`` range line (followed by the
    proc string when there is one) and then the leading context, the
    changed lines and the trailing context.
    """
    contextlen = len(self.before) + len(self.after)
    # the "no newline" marker sits in the trailing context but is not a
    # real line of either file, so it must not be counted
    if self.after and self.after[-1] == '\\ No newline at end of file\n':
        contextlen -= 1
    fromlen = contextlen + self.removed
    tolen = contextlen + self.added
    procsuffix = self.proc and (' ' + self.proc)
    fp.write('@@ -%d,%d +%d,%d @@%s\n' %
             (self.fromline, fromlen, self.toline, tolen, procsuffix))
    body = self.before + self.hunk + self.after
    fp.write(''.join(body))

pretty = write
993 994
def filename(self):
    """Return the file name reported by this hunk's header."""
    header = self.header
    return header.filename()
996 997
def __repr__(self):
    """Show the hunk as ``<hunk 'filename'@fromline>``."""
    where = (self.filename(), self.fromline)
    return '<hunk %r@%d>' % where
999 1000
def getmessages():
    """Return the translated prompt strings used by filterpatch.

    The result is a dict with three entries, each keyed again by the
    operation name ('apply', 'discard' or 'record'):

    - 'multiple': per-change question when several changes exist
      (takes index, total and file name)
    - 'single': per-change question when there is only one change
      (takes the file name)
    - 'help': the choice string, '$$'-separated, with '&' marking the
      key of each choice
    """
    multiple = {
        'apply': _("apply change %d/%d to '%s'?"),
        'discard': _("discard change %d/%d to '%s'?"),
        'record': _("record change %d/%d to '%s'?"),
    }
    single = {
        'apply': _("apply this change to '%s'?"),
        'discard': _("discard this change to '%s'?"),
        'record': _("record this change to '%s'?"),
    }
    # the literals stay spelled out in full (rather than generated from
    # a template) so each complete message is passed to _() as written
    choices = {
        'apply': _('[Ynesfdaq?]'
                   '$$ &Yes, apply this change'
                   '$$ &No, skip this change'
                   '$$ &Edit this change manually'
                   '$$ &Skip remaining changes to this file'
                   '$$ Apply remaining changes to this &file'
                   '$$ &Done, skip remaining changes and files'
                   '$$ Apply &all changes to all remaining files'
                   '$$ &Quit, applying no changes'
                   '$$ &? (display help)'),
        'discard': _('[Ynesfdaq?]'
                     '$$ &Yes, discard this change'
                     '$$ &No, skip this change'
                     '$$ &Edit this change manually'
                     '$$ &Skip remaining changes to this file'
                     '$$ Discard remaining changes to this &file'
                     '$$ &Done, skip remaining changes and files'
                     '$$ Discard &all changes to all remaining files'
                     '$$ &Quit, discarding no changes'
                     '$$ &? (display help)'),
        'record': _('[Ynesfdaq?]'
                    '$$ &Yes, record this change'
                    '$$ &No, skip this change'
                    '$$ &Edit this change manually'
                    '$$ &Skip remaining changes to this file'
                    '$$ Record remaining changes to this &file'
                    '$$ &Done, skip remaining changes and files'
                    '$$ Record &all changes to all remaining files'
                    '$$ &Quit, recording no changes'
                    '$$ &? (display help)'),
    }
    return {
        'multiple': multiple,
        'single': single,
        'help': choices,
    }
1045 1046
def filterpatch(ui, headers, operation=None):
    """Interactively filter patch chunks into applied-only chunks

    ui is used for all prompting and output. headers is the list of
    parsed file headers (each carrying its hunks). operation selects the
    wording of the prompts ('apply', 'discard' or 'record'); it defaults
    to 'record'.

    Returns a tuple (chunks, {}), where chunks is a flat list mixing the
    selected headers with the hunks chosen for them. A header is kept
    only if it is special() or at least one of its hunks was selected.
    """
    messages = getmessages()

    if operation is None:
        operation = 'record'

    def prompt(skipfile, skipall, query, chunk):
        """prompt query, and process base inputs

        - y/n for the rest of file
        - y/n for the rest
        - ? (help)
        - q (quit)

        Return True/False and possibly updated skipfile and skipall.
        The fourth returned value is the list of patches parsed from the
        user's edit of the chunk, or None if nothing was edited.
        """
        newpatches = None
        if skipall is not None:
            return skipall, skipfile, skipall, newpatches
        if skipfile is not None:
            return skipfile, skipfile, skipall, newpatches
        while True:
            resps = messages['help'][operation]
            r = ui.promptchoice("%s %s" % (query, resps))
            ui.write("\n")
            if r == 8: # ?
                for c, t in ui.extractchoices(resps)[1]:
                    ui.write('%s - %s\n' % (c, encoding.lower(t)))
                continue
            elif r == 0: # yes
                ret = True
            elif r == 1: # no
                ret = False
            elif r == 2: # Edit patch
                if chunk is None:
                    ui.write(_('cannot edit patch for whole file'))
                    ui.write("\n")
                    continue
                if chunk.header.binary():
                    ui.write(_('cannot edit patch for binary file'))
                    ui.write("\n")
                    continue
                # Patch comment based on the Git one (based on comment at end of
                # https://mercurial-scm.org/wiki/RecordExtension)
                phelp = '---' + _("""
To remove '-' lines, make them ' ' lines (context).
To remove '+' lines, delete them.
Lines starting with # will be removed from the patch.

If the patch applies cleanly, the edited hunk will immediately be
added to the record list. If it does not apply cleanly, a rejects
file will be generated: you can use that when you try again. If
all lines of the hunk are removed, then the edit is aborted and
the hunk is left unchanged.
""")
                (patchfd, patchfn) = tempfile.mkstemp(prefix="hg-editor-",
                        suffix=".diff", text=True)
                ncpatchfp = None
                try:
                    # Write the initial patch
                    f = os.fdopen(patchfd, pycompat.sysstr("w"))
                    try:
                        chunk.header.write(f)
                        chunk.write(f)
                        f.write('\n'.join(['# ' + i
                                           for i in phelp.splitlines()]))
                    finally:
                        # always release the handle: the unlink below
                        # cannot remove a file that is still open on
                        # Windows
                        f.close()
                    # Start the editor and wait for it to complete
                    editor = ui.geteditor()
                    ret = ui.system("%s \"%s\"" % (editor, patchfn),
                                    environ={'HGUSER': ui.username()},
                                    blockedtag='filterpatch')
                    if ret != 0:
                        ui.warn(_("editor exited with exit code %d\n") % ret)
                        continue
                    # Remove comment lines
                    patchfp = open(patchfn)
                    try:
                        ncpatchfp = stringio()
                        for line in util.iterfile(patchfp):
                            if not line.startswith('#'):
                                ncpatchfp.write(line)
                    finally:
                        patchfp.close()
                    ncpatchfp.seek(0)
                    newpatches = parsepatch(ncpatchfp)
                finally:
                    os.unlink(patchfn)
                    del ncpatchfp
                # Signal that the chunk shouldn't be applied as-is, but
                # provide the new patch to be used instead.
                ret = False
            elif r == 3: # Skip
                ret = skipfile = False
            elif r == 4: # file (Record remaining)
                ret = skipfile = True
            elif r == 5: # done, skip remaining
                ret = skipall = False
            elif r == 6: # all
                ret = skipall = True
            elif r == 7: # quit
                raise error.Abort(_('user quit'))
            return ret, skipfile, skipall, newpatches

    seen = set()
    applied = {}        # 'filename' -> [] of chunks
    skipfile, skipall = None, None
    pos, total = 1, sum(len(h.hunks) for h in headers)
    for h in headers:
        pos += len(h.hunks)
        skipfile = None
        # running shift of target line numbers caused by hunks of this
        # file that were NOT selected
        fixoffset = 0
        hdr = ''.join(h.header)
        if hdr in seen:
            continue
        seen.add(hdr)
        if skipall is None:
            h.pretty(ui)
        msg = (_('examine changes to %s?') %
               _(' and ').join("'%s'" % f for f in h.files()))
        r, skipfile, skipall, np = prompt(skipfile, skipall, msg, None)
        if not r:
            continue
        applied[h.filename()] = [h]
        if h.allhunks():
            applied[h.filename()] += h.hunks
            continue
        for i, chunk in enumerate(h.hunks):
            if skipfile is None and skipall is None:
                chunk.pretty(ui)
            if total == 1:
                msg = messages['single'][operation] % chunk.filename()
            else:
                idx = pos - len(h.hunks) + i
                msg = messages['multiple'][operation] % (idx, total,
                                                         chunk.filename())
            r, skipfile, skipall, newpatches = prompt(skipfile,
                    skipall, msg, chunk)
            if r:
                if fixoffset:
                    # work on a copy so the caller's hunk keeps its
                    # original line number
                    chunk = copy.copy(chunk)
                    chunk.toline += fixoffset
                applied[chunk.filename()].append(chunk)
            elif newpatches is not None:
                for newpatch in newpatches:
                    for newhunk in newpatch.hunks:
                        if fixoffset:
                            newhunk.toline += fixoffset
                        applied[newhunk.filename()].append(newhunk)
            else:
                fixoffset += chunk.removed - chunk.added
    return (sum([h for h in applied.itervalues()
               if h[0].special() or len(h) > 1], []), {})
class hunk(object):
    """One hunk of a unified or context diff.

    Attributes set here:
    - number: 1-based index of the hunk, used in error messages
    - desc: the range line introducing the hunk
    - hunk: the hunk lines in unified form, desc first
    - a / b: the old-side and new-side lines
    - starta, lena, startb, lenb: the ranges parsed from desc
    """
    def __init__(self, desc, num, lr, context):
        """Create hunk number num from its range line desc.

        When lr (a line reader) is not None the hunk body is read from
        it, as a context diff if context is true and as a unified diff
        otherwise. With lr=None an empty shell is created.
        """
        self.number = num
        self.desc = desc
        self.hunk = [desc]
        self.a = []
        self.b = []
        self.starta = self.lena = None
        self.startb = self.lenb = None
        if lr is not None:
            if context:
                self.read_context_hunk(lr)
            else:
                self.read_unified_hunk(lr)

    def getnormalized(self):
        """Return a copy with line endings normalized to LF."""

        def normalize(lines):
            nlines = []
            for line in lines:
                if line.endswith('\r\n'):
                    line = line[:-2] + '\n'
                nlines.append(line)
            return nlines

        # Dummy object, it is rebuilt manually
        nh = hunk(self.desc, self.number, None, None)
        nh.number = self.number
        nh.desc = self.desc
        # note: the hunk list itself is shared, only a and b are rewritten
        nh.hunk = self.hunk
        nh.a = normalize(self.a)
        nh.b = normalize(self.b)
        nh.starta = self.starta
        nh.startb = self.startb
        nh.lena = self.lena
        nh.lenb = self.lenb
        return nh

    def read_unified_hunk(self, lr):
        """Parse a unified-diff hunk body from lr.

        Raises PatchError if self.desc is not a valid unified range line.
        """
        m = unidesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.starta, self.lena, self.startb, self.lenb = m.groups()
        # an omitted length means a single line
        if self.lena is None:
            self.lena = 1
        else:
            self.lena = int(self.lena)
        if self.lenb is None:
            self.lenb = 1
        else:
            self.lenb = int(self.lenb)
        self.starta = int(self.starta)
        self.startb = int(self.startb)
        diffhelpers.addlines(lr, self.hunk, self.lena, self.lenb, self.a,
                             self.b)
        # if we hit eof before finishing out the hunk, the last line will
        # be zero length.  Lets try to fix it up.
        while len(self.hunk[-1]) == 0:
            del self.hunk[-1]
            del self.a[-1]
            del self.b[-1]
            self.lena -= 1
            self.lenb -= 1
        self._fixnewline(lr)

    def read_context_hunk(self, lr):
        """Parse a context-diff hunk from lr and convert it to unified form.

        The old block is read first, then the new block is merged into
        self.hunk so that it ends up ordered like a unified hunk. Raises
        PatchError on malformed range lines or unexpected line prefixes.
        """
        self.desc = lr.readline()
        m = contextdesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.starta, aend = m.groups()
        self.starta = int(self.starta)
        if aend is None:
            aend = self.starta
        self.lena = int(aend) - self.starta
        if self.starta:
            self.lena += 1
        for x in xrange(self.lena):
            l = lr.readline()
            if l.startswith('---'):
                # lines addition, old block is empty
                lr.push(l)
                break
            # every body line carries a two-character prefix
            s = l[2:]
            if l.startswith('- ') or l.startswith('! '):
                u = '-' + s
            elif l.startswith('  '):
                u = ' ' + s
            else:
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.a.append(u)
            self.hunk.append(u)

        l = lr.readline()
        if l.startswith(r'\ '):
            # "\ No newline at end of file": drop the last char of the
            # previous old line
            s = self.a[-1][:-1]
            self.a[-1] = s
            self.hunk[-1] = s
            l = lr.readline()
        m = contextdesc.match(l)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.startb, bend = m.groups()
        self.startb = int(self.startb)
        if bend is None:
            bend = self.startb
        self.lenb = int(bend) - self.startb
        if self.startb:
            self.lenb += 1
        # position in self.hunk where the next new-side line is merged
        hunki = 1
        for x in xrange(self.lenb):
            l = lr.readline()
            if l.startswith(r'\ '):
                # XXX: the only way to hit this is with an invalid line range.
                # The no-eol marker is not counted in the line range, but I
                # guess there are diff(1) out there which behave differently.
                s = self.b[-1][:-1]
                self.b[-1] = s
                self.hunk[hunki - 1] = s
                continue
            if not l:
                # line deletions, new block is empty and we hit EOF
                lr.push(l)
                break
            s = l[2:]
            if l.startswith('+ ') or l.startswith('! '):
                u = '+' + s
            elif l.startswith('  '):
                u = ' ' + s
            elif len(self.b) == 0:
                # line deletions, new block is empty
                lr.push(l)
                break
            else:
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.b.append(s)
            # walk forward through the unified lines: skip removals, stop
            # on the matching context line, otherwise insert the new line
            while True:
                if hunki >= len(self.hunk):
                    h = ""
                else:
                    h = self.hunk[hunki]
                hunki += 1
                if h == u:
                    break
                elif h.startswith('-'):
                    continue
                else:
                    self.hunk.insert(hunki - 1, u)
                    break

        if not self.a:
            # this happens when lines were only added to the hunk
            for x in self.hunk:
                if x.startswith('-') or x.startswith(' '):
                    self.a.append(x)
        if not self.b:
            # this happens when lines were only deleted from the hunk
            for x in self.hunk:
                if x.startswith('+') or x.startswith(' '):
                    self.b.append(x[1:])
        # @@ -start,len +start,len @@
        self.desc = "@@ -%d,%d +%d,%d @@\n" % (self.starta, self.lena,
                                               self.startb, self.lenb)
        self.hunk[0] = self.desc
        self._fixnewline(lr)

    def _fixnewline(self, lr):
        """Consume a trailing no-newline marker line, if there is one.

        Any other line is pushed back onto lr untouched.
        """
        l = lr.readline()
        if l.startswith(r'\ '):
            diffhelpers.fix_newline(self.hunk, self.a, self.b)
        else:
            lr.push(l)

    def complete(self):
        """Tell whether as many old/new lines were read as desc announced."""
        return len(self.a) == self.lena and len(self.b) == self.lenb

    def _fuzzit(self, old, new, fuzz, toponly):
        """Drop up to fuzz context lines from the edges of old and new.

        Returns (old, new, top) where top is the number of lines removed
        from the start. With toponly set, nothing is removed from the end.
        """
        # this removes context lines from the top and bottom of list 'l'.  It
        # checks the hunk to make sure only context lines are removed, and then
        # returns a new shortened list of lines.
        fuzz = min(fuzz, len(old))
        if fuzz:
            top = 0
            bot = 0
            hlen = len(self.hunk)
            for x in xrange(hlen - 1):
                # the hunk starts with the @@ line, so use x+1
                if self.hunk[x + 1].startswith(' '):
                    top += 1
                else:
                    break
            if not toponly:
                for x in xrange(hlen - 1):
                    if self.hunk[hlen - bot - 1].startswith(' '):
                        bot += 1
                    else:
                        break

            bot = min(fuzz, bot)
            top = min(fuzz, top)
            return old[top:len(old) - bot], new[top:len(new) - bot], top
        return old, new, 0

    def fuzzit(self, fuzz, toponly):
        """Return (old, oldstart, new, newstart) after applying fuzz.

        The start values are shifted by the number of context lines
        removed from the top and converted to 0-based offsets.
        """
        old, new, top = self._fuzzit(self.a, self.b, fuzz, toponly)
        oldstart = self.starta + top
        newstart = self.startb + top
        # zero length hunk ranges already have their start decremented
        if self.lena and oldstart > 0:
            oldstart -= 1
        if self.lenb and newstart > 0:
            newstart -= 1
        return old, oldstart, new, newstart
1412 1413
class binhunk(object):
    'A binary patch file.'
    def __init__(self, lr, fname):
        """Read a git binary patch for file fname from line reader lr."""
        self.text = None
        self.delta = False
        self.hunk = ['GIT binary patch\n']
        self._fname = fname
        self._read(lr)

    def complete(self):
        """Tell whether the payload was decoded."""
        return self.text is not None

    def new(self, lines):
        """Return the new file content as a one-element list.

        For a delta patch the payload is applied on top of the joined
        lines; for a literal patch the payload is the content itself.
        """
        if not self.delta:
            return [self.text]
        return [applybindelta(self.text, ''.join(lines))]

    def _read(self, lr):
        """Decode the base85/zlib payload from lr into self.text.

        Every line consumed is also recorded in self.hunk. Raises
        PatchError when no 'literal'/'delta' header is found, when a
        line cannot be decoded, or when the decompressed size does not
        match the announced one.
        """
        def nextline():
            raw = lr.readline()
            self.hunk.append(raw)
            return raw.rstrip('\r\n')

        # look for the "literal <size>" or "delta <size>" header
        size = 0
        while True:
            line = nextline()
            if not line:
                raise PatchError(_('could not extract "%s" binary data')
                                 % self._fname)
            if line.startswith('literal '):
                size = int(line[8:].rstrip())
                break
            if line.startswith('delta '):
                size = int(line[6:].rstrip())
                self.delta = True
                break

        pieces = []
        line = nextline()
        while len(line) > 1:
            # the first character encodes how many decoded bytes the
            # line holds: 'A'-'Z' mean 1-26, the 'a' range starts at 27
            marker = line[0]
            if 'A' <= marker <= 'Z':
                nbytes = ord(marker) - ord('A') + 1
            else:
                nbytes = ord(marker) - ord('a') + 27
            try:
                pieces.append(util.b85decode(line[1:])[:nbytes])
            except ValueError as e:
                raise PatchError(_('could not decode "%s" binary patch: %s')
                                 % (self._fname, str(e)))
            line = nextline()

        text = zlib.decompress(''.join(pieces))
        if len(text) != size:
            raise PatchError(_('"%s" length is %d bytes, should be %d')
                             % (self._fname, len(text), size))
        self.text = text
1468 1469
def parsefilename(str):
    """Extract the file name from a '--- name' or '+++ name' diff line.

    The first four characters and the line ending are dropped. The name
    then ends at the first tab, or, if there is no tab, at the first
    space; without either the whole remainder is the name.
    """
    # --- filename \t|space stuff
    name = str[4:].rstrip('\r\n')
    for separator in ('\t', ' '):
        cut = name.find(separator)
        if cut >= 0:
            return name[:cut]
    return name
1478 1479
def reversehunks(hunks):
    '''reverse the signs in the hunks given as argument

    This function operates on hunks coming out of patch.filterpatch, that is
    a list of the form: [header1, hunk1, hunk2, header2...]. Example usage:

    >>> rawpatch = b"""diff --git a/folder1/g b/folder1/g
    ... --- a/folder1/g
    ... +++ b/folder1/g
    ... @@ -1,7 +1,7 @@
    ... +firstline
    ...  c
    ...  1
    ...  2
    ... + 3
    ... -4
    ...  5
    ...  d
    ... +lastline"""
    >>> hunks = parsepatch([rawpatch])
    >>> hunkscomingfromfilterpatch = []
    >>> for h in hunks:
    ...     hunkscomingfromfilterpatch.append(h)
    ...     hunkscomingfromfilterpatch.extend(h.hunks)

    >>> reversedhunks = reversehunks(hunkscomingfromfilterpatch)
    >>> from . import util
    >>> fp = util.stringio()
    >>> for c in reversedhunks:
    ...     c.write(fp)
    >>> fp.seek(0) or None
    >>> reversedpatch = fp.read()
    >>> print(pycompat.sysstr(reversedpatch))
    diff --git a/folder1/g b/folder1/g
    --- a/folder1/g
    +++ b/folder1/g
    @@ -1,4 +1,3 @@
    -firstline
     c
     1
     2
    @@ -2,6 +1,6 @@
     c
     1
     2
    - 3
    +4
     5
     d
    @@ -6,3 +5,2 @@
     5
     d
    -lastline

    '''

    # entries without a reversehunk method (the headers) pass through as-is
    return [c.reversehunk() if util.safehasattr(c, 'reversehunk') else c
            for c in hunks]
1541 1542
def parsepatch(originalchunks, maxcontext=None):
    """patch -> [] of headers -> [] of hunks

    If maxcontext is not None, trim context lines if necessary.

    >>> rawpatch = b'''diff --git a/folder1/g b/folder1/g
    ... --- a/folder1/g
    ... +++ b/folder1/g
    ... @@ -1,8 +1,10 @@
    ...  1
    ...  2
    ... -3
    ...  4
    ...  5
    ...  6
    ... +6.1
    ... +6.2
    ...  7
    ...  8
    ... +9'''
    >>> out = util.stringio()
    >>> headers = parsepatch([rawpatch], maxcontext=1)
    >>> for header in headers:
    ...     header.write(out)
    ...     for hunk in header.hunks:
    ...         hunk.write(out)
    >>> print(pycompat.sysstr(out.getvalue()))
    diff --git a/folder1/g b/folder1/g
    --- a/folder1/g
    +++ b/folder1/g
    @@ -2,3 +2,2 @@
     2
    -3
     4
    @@ -6,2 +5,4 @@
     6
    +6.1
    +6.2
     7
    @@ -8,1 +9,2 @@
     8
    +9
    """
    class parser(object):
        """patch parsing state machine"""
        def __init__(self):
            self.fromline = 0
            self.toline = 0
            self.proc = ''
            self.header = None
            self.context = []
            self.before = []
            self.hunk = []
            self.headers = []

        def addrange(self, limits):
            # only the two start positions and the proc text are kept
            fromstart, _fromend, tostart, _toend, proc = limits
            self.fromline = int(fromstart)
            self.toline = int(tostart)
            self.proc = proc

        def addcontext(self, context):
            # a context run closes the pending changed lines, if any
            if self.hunk:
                leading = len(self.before)
                h = recordhunk(self.header, self.fromline, self.toline,
                               self.proc, self.before, self.hunk, context,
                               maxcontext)
                self.header.hunks.append(h)
                self.fromline += leading + h.removed
                self.toline += leading + h.added
                self.before = []
                self.hunk = []
            self.context = context

        def addhunk(self, hunk):
            # context seen just before the change becomes its lead-in
            if self.context:
                self.before = self.context
                self.context = []
            self.hunk = hunk

        def newfile(self, hdr):
            # flush whatever belongs to the previous file first
            self.addcontext([])
            h = header(hdr)
            self.headers.append(h)
            self.header = h

        def addother(self, line):
            pass # 'other' lines are ignored

        def finished(self):
            self.addcontext([])
            return self.headers

        # current state -> {next state -> handler}
        transitions = {
            'file': {'context': addcontext,
                     'file': newfile,
                     'hunk': addhunk,
                     'range': addrange},
            'context': {'file': newfile,
                        'hunk': addhunk,
                        'range': addrange,
                        'other': addother},
            'hunk': {'context': addcontext,
                     'file': newfile,
                     'range': addrange},
            'range': {'context': addcontext,
                      'hunk': addhunk},
            'other': {'other': addother},
            }

    machine = parser()
    stream = stringio()
    stream.write(''.join(originalchunks))
    stream.seek(0)

    state = 'context'
    for newstate, data in scanpatch(stream):
        try:
            machine.transitions[state][newstate](machine, data)
        except KeyError:
            raise PatchError('unhandled transition: %s -> %s' %
                             (state, newstate))
        state = newstate
    del stream
    return machine.finished()
1665 1666
def pathtransform(path, strip, prefix):
    '''turn a path from a patch into a path suitable for the repository

    prefix, if not empty, is expected to be normalized with a / at the end.

    Returns (stripped components, path in repository).

    >>> pathtransform(b'a/b/c', 0, b'')
    ('', 'a/b/c')
    >>> pathtransform(b' a/b/c ', 0, b'')
    ('', ' a/b/c')
    >>> pathtransform(b' a/b/c ', 2, b'')
    ('a/b/', 'c')
    >>> pathtransform(b'a/b/c', 0, b'd/e/')
    ('', 'd/e/a/b/c')
    >>> pathtransform(b' a//b/c ', 2, b'd/e/')
    ('a//b/', 'd/e/c')
    >>> pathtransform(b'a/b/c', 3, b'')
    Traceback (most recent call last):
    PatchError: unable to strip away 1 of 3 dirs from a/b/c
    '''
    if strip == 0:
        return '', prefix + path.rstrip()

    pathlen = len(path)
    cut = 0
    # 'remaining' counts down the components still to be stripped
    for remaining in range(strip, 0, -1):
        cut = path.find('/', cut)
        if cut == -1:
            raise PatchError(_("unable to strip away %d of %d dirs from %s") %
                             (remaining, strip, path))
        cut += 1
        # consume '//' in the path
        while cut < pathlen - 1 and path[cut:cut + 1] == '/':
            cut += 1
    stripped = path[:cut].lstrip()
    return stripped, prefix + path[cut:].rstrip()
1703 1704
def makepatchmeta(backend, afile_orig, bfile_orig, hunk, strip, prefix):
    """Build the patchmeta describing which file a plain patch targets.

    afile_orig and bfile_orig are the names from the '---'/'+++' lines,
    hunk is the first hunk of the file, and strip/prefix are forwarded
    to pathtransform. backend.exists() is consulted to see which of the
    two candidate names is present. The result has op set to 'ADD' or
    'DELETE' when the patch creates or removes the file.

    Raises PatchError if both names are /dev/null.
    """
    nulla = afile_orig == "/dev/null"
    nullb = bfile_orig == "/dev/null"
    emptya = hunk.starta == 0 and hunk.lena == 0
    create = nulla and emptya
    remove = nullb and hunk.startb == 0 and hunk.lenb == 0
    abase, afile = pathtransform(afile_orig, strip, prefix)
    gooda = not nulla and backend.exists(afile)
    bbase, bfile = pathtransform(bfile_orig, strip, prefix)
    if afile == bfile:
        goodb = gooda
    else:
        goodb = not nullb and backend.exists(bfile)
    missing = not goodb and not gooda and not create

    # some diff programs apparently produce patches where the afile is
    # not /dev/null, but afile starts with bfile
    abasedir = afile[:afile.rfind('/') + 1]
    bbasedir = bfile[:bfile.rfind('/') + 1]
    if (missing and abasedir == bbasedir and afile.startswith(bfile)
        and emptya):
        create = True
        missing = False

    # If afile is "a/b/foo" and bfile is "a/b/foo.orig" we assume the
    # diff is between a file and its backup. In this case, the original
    # file should be patched (see original mpatch code).
    isbackup = (abase == bbase and bfile.startswith(afile))
    if isbackup:
        preferred = afile
    else:
        preferred = bfile

    fname = None
    if not missing:
        if gooda and goodb:
            fname = preferred
        elif gooda:
            fname = afile

    if not fname:
        if not nullb:
            fname = preferred
        elif not nulla:
            fname = afile
        else:
            raise PatchError(_("undefined source and destination files"))

    gp = patchmeta(fname)
    if create:
        gp.op = 'ADD'
    elif remove:
        gp.op = 'DELETE'
    return gp
1758 1759
def scanpatch(fp):
    """like patch.iterhunks, but yield different events

    - ('file',    [header_lines + fromfile + tofile])
    - ('context', [context_lines])
    - ('hunk',    [hunk_lines])
    - ('range',   (-start,len, +start,len, proc))

    Lines matching none of the above are yielded as ('other', line).
    """
    lines_re = re.compile(br'@@ -(\d+),(\d+) \+(\d+),(\d+) @@\s*(.*)')
    lr = linereader(fp)

    def scanwhile(first, p):
        """scan lr while predicate holds"""
        collected = [first]
        for nextline in iter(lr.readline, ''):
            if not p(nextline):
                # first line that does not belong: give it back
                lr.push(nextline)
                break
            collected.append(nextline)
        return collected

    def notheader(line):
        s = line.split(None, 1)
        return not s or s[0] not in ('---', 'diff')

    contextstarts = (' ', '\\')
    hunkstarts = ('-', '+', '\\')

    for line in iter(lr.readline, ''):
        if line.startswith(('diff --git a/', 'diff -r ')):
            header = scanwhile(line, notheader)
            fromfile = lr.readline()
            if fromfile.startswith('---'):
                tofile = lr.readline()
                header += [fromfile, tofile]
            else:
                lr.push(fromfile)
            yield 'file', header
        elif line.startswith(' '):
            yield 'context', scanwhile(line,
                                       lambda l: l.startswith(contextstarts))
        elif line.startswith(('-', '+')):
            yield 'hunk', scanwhile(line, lambda l: l.startswith(hunkstarts))
        else:
            m = lines_re.match(line)
            if m:
                yield 'range', m.groups()
            else:
                yield 'other', line
1804 1805
def scangitpatch(lr, firstline):
    """
    Git patches can emit:
    - rename a to b
    - change b
    - copy a to c
    - change c

    We cannot apply this sequence as-is, the renamed 'a' could not be
    found for it would have been renamed already. And we cannot copy
    from 'b' instead because 'b' would have been changed already. So
    we scan the git patch for copy and rename commands so we can
    perform the copies ahead of time.

    The underlying file is rewound to where it was before returning.
    """
    source = lr.fp
    try:
        pos = source.tell()
    except IOError:
        # cannot report a position: buffer the rest of the input instead
        pos = 0
        source = stringio(source.read())
    gitlr = linereader(source)
    gitlr.push(firstline)
    gitpatches = readgitpatch(gitlr)
    source.seek(pos)
    return gitpatches
1830 1831
def iterhunks(fp):
    """Read a patch and yield the following events:
    - ("file", afile, bfile, firsthunk): select a new target file.
    - ("hunk", hunk): a new hunk is ready to be applied, follows a
    "file" event.
    - ("git", gitchanges): current diff is in git format, gitchanges
    maps filenames to gitpatch records. Unique event.
    """
    contextsep = '***************'
    binarymark = 'GIT binary patch'

    afile = ""
    bfile = ""
    state = None
    hunknum = 0
    emitfile = newfile = False
    gitpatches = None

    # our states
    BFILE = 1
    # None: format not known yet, True: context diff, False: unified diff
    context = None
    lr = linereader(fp)

    for line in iter(lr.readline, ''):
        if state == BFILE and (
            (not context and line[0] == '@')
            or (context is not False and line.startswith(contextsep))
            or line.startswith(binarymark)):
            gp = None
            if (gitpatches and
                gitpatches[-1].ispatching(afile, bfile)):
                gp = gitpatches.pop()
            if line.startswith(binarymark):
                h = binhunk(lr, gp.path)
            else:
                if context is None and line.startswith(contextsep):
                    context = True
                h = hunk(line, hunknum + 1, lr, context)
            hunknum += 1
            if emitfile:
                emitfile = False
                yield 'file', (afile, bfile, h, gp and gp.copy() or None)
            yield 'hunk', h
        elif line.startswith('diff --git a/'):
            m = gitre.match(line.rstrip(' \r\n'))
            if not m:
                continue
            if gitpatches is None:
                # scan whole input for git metadata
                gitpatches = scangitpatch(lr, line)
                yield 'git', [g.copy() for g in gitpatches
                              if g.op in ('COPY', 'RENAME')]
                # reversed so entries can be popped in patch order
                gitpatches.reverse()
            afile = 'a/' + m.group(1)
            bfile = 'b/' + m.group(2)
            while gitpatches and not gitpatches[-1].ispatching(afile, bfile):
                gp = gitpatches.pop()
                yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())
            if not gitpatches:
                raise PatchError(_('failed to synchronize metadata for "%s"')
                                 % afile[2:])
            gp = gitpatches[-1]
            newfile = True
        elif line.startswith('---'):
            # check for a unified diff
            second = lr.readline()
            if not second.startswith('+++'):
                lr.push(second)
                continue
            newfile = True
            context = False
            afile = parsefilename(line)
            bfile = parsefilename(second)
        elif line.startswith('***'):
            # check for a context diff
            second = lr.readline()
            if not second.startswith('---'):
                lr.push(second)
                continue
            third = lr.readline()
            lr.push(third)
            if not third.startswith(contextsep):
                lr.push(second)
                continue
            newfile = True
            context = True
            afile = parsefilename(line)
            bfile = parsefilename(second)

        if newfile:
            newfile = False
            emitfile = True
            state = BFILE
            hunknum = 0

    # git entries never matched by a diff line still produce a file event
    while gitpatches:
        gp = gitpatches.pop()
        yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())
1926 1927
def applybindelta(binchunk, data):
    """Apply a binary delta hunk
    The algorithm used is the algorithm from git's patch-delta.c

    binchunk is the decoded delta: two variable-length size headers
    followed by a sequence of commands. data is the content the delta
    is applied to. Returns the reconstructed content.

    Raises PatchError if the delta contains the reserved opcode 0.
    """
    def byteat(pos):
        # slice instead of index: indexing a bytes object yields an int
        # on Python 3, which ord() rejects
        return ord(binchunk[pos:pos + 1])

    def skiphead(pos):
        """return the position just past the size header starting at pos"""
        end = len(binchunk)
        while pos < end:
            last = not (byteat(pos) & 0x80)
            pos += 1
            if last:
                break
        return pos

    # the source and target sizes are not needed, skip both headers
    i = skiphead(skiphead(0))
    end = len(binchunk)
    # collect the pieces and join once; repeated += is quadratic
    out = []
    while i < end:
        cmd = byteat(i)
        i += 1
        if (cmd & 0x80):
            # copy from data: the low bits of cmd tell which offset and
            # size bytes follow, least significant byte first
            offset = 0
            size = 0
            for bit, shift in ((0x01, 0), (0x02, 8), (0x04, 16), (0x08, 24)):
                if (cmd & bit):
                    offset |= byteat(i) << shift
                    i += 1
            for bit, shift in ((0x10, 0), (0x20, 8), (0x40, 16)):
                if (cmd & bit):
                    size |= byteat(i) << shift
                    i += 1
            if size == 0:
                size = 0x10000
            offset_end = offset + size
            out.append(data[offset:offset_end])
        elif cmd != 0:
            # insert the next cmd bytes of the delta itself
            offset_end = i + cmd
            out.append(binchunk[i:offset_end])
            i += cmd
        else:
            raise PatchError(_('unexpected delta opcode 0'))
    return ''.join(out)
1982 1983
def applydiff(ui, fp, backend, store, strip=1, prefix='', eolmode='strict'):
    """Read a patch from fp and try to apply it using ``patchfile``.

    The return value is 0 for a clean patch, -1 if any rejects were found
    and 1 if there was any fuzz.

    With 'eolmode' set to 'strict', the patch content and patched file are
    read in binary mode. Any other value ignores line endings when patching
    and then normalizes them according to 'eolmode'.
    """
    status = _applydiff(ui, fp, patchfile, backend, store,
                        strip=strip, prefix=prefix, eolmode=eolmode)
    return status
1995 1996
1996 1997 def _canonprefix(repo, prefix):
1997 1998 if prefix:
1998 1999 prefix = pathutil.canonpath(repo.root, repo.getcwd(), prefix)
1999 2000 if prefix != '':
2000 2001 prefix += '/'
2001 2002 return prefix
2002 2003
def _applydiff(ui, fp, patcher, backend, store, strip=1, prefix='',
               eolmode='strict'):
    """Drive the events produced by iterhunks(fp) and apply them.

    'patcher' is called as patcher(ui, gp, backend, store, eolmode=eolmode)
    for every file that has hunks; the returned object must provide
    apply(hunk) and close().

    Returns -1 if anything was rejected, otherwise 1 if any apply() call
    returned a positive value, otherwise 0. Raises error.Abort on an
    unknown parser state and PatchError for a missing copy/rename source
    or an already existing destination.
    """
    prefix = _canonprefix(backend.repo, prefix)
    def pstrip(p):
        return pathtransform(p, strip - 1, prefix)[1]

    rejects = 0
    err = 0
    current_file = None

    for state, values in iterhunks(fp):
        if state == 'hunk':
            # hunks of a file that could not be opened are dropped
            if not current_file:
                continue
            ret = current_file.apply(values)
            if ret > 0:
                err = 1
        elif state == 'file':
            # finish the previous file before starting the next one
            if current_file:
                rejects += current_file.close()
                current_file = None
            afile, bfile, first_hunk, gp = values
            if gp:
                gp.path = pstrip(gp.path)
                if gp.oldpath:
                    gp.oldpath = pstrip(gp.oldpath)
            else:
                gp = makepatchmeta(backend, afile, bfile, first_hunk, strip,
                                   prefix)
            if gp.op == 'RENAME':
                backend.unlink(gp.oldpath)
            if not first_hunk:
                # metadata-only change: no hunks will follow for this file
                if gp.op == 'DELETE':
                    backend.unlink(gp.path)
                    continue
                data, mode = None, None
                if gp.op in ('RENAME', 'COPY'):
                    data, mode = store.getfile(gp.oldpath)[:2]
                    if data is None:
                        # This means that the old path does not exist
                        raise PatchError(_("source file '%s' does not exist")
                                           % gp.oldpath)
                if gp.mode:
                    mode = gp.mode
                    if gp.op == 'ADD':
                        # Added files without content have no hunk and
                        # must be created
                        data = ''
                if data or mode:
                    if (gp.op in ('ADD', 'RENAME', 'COPY')
                        and backend.exists(gp.path)):
                        raise PatchError(_("cannot create %s: destination "
                                           "already exists") % gp.path)
                    backend.setfile(gp.path, data, mode, gp.oldpath)
                continue
            try:
                current_file = patcher(ui, gp, backend, store,
                                       eolmode=eolmode)
            except PatchError as inst:
                # count the file as rejected and keep processing the patch
                ui.warn(str(inst) + '\n')
                current_file = None
                rejects += 1
                continue
        elif state == 'git':
            # save the current content of copy/rename sources into the store
            for gp in values:
                path = pstrip(gp.oldpath)
                data, mode = backend.getfile(path)
                if data is None:
                    # The error ignored here will trigger a getfile()
                    # error in a place more appropriate for error
                    # handling, and will not interrupt the patching
                    # process.
                    pass
                else:
                    store.setfile(path, data, mode)
        else:
            raise error.Abort(_('unsupported parser state: %s') % state)

    if current_file:
        rejects += current_file.close()

    if rejects:
        return -1
    return err
2087 2088
def _externalpatch(ui, repo, patcher, patchname, strip, files,
                   similarity):
    """use <patcher> to apply <patchname> to the working directory.
    returns whether patch was applied with fuzz factor.

    Every file name reported by the tool is added to 'files'. If 'files'
    is not empty afterwards it is handed to scmutil.marktouched(), even
    when reading the tool output fails. Raises PatchError when the command
    exits with a non-zero status.
    """

    fuzz = False
    # Name of the file currently reported by the tool, and whether that
    # name has already been echoed ahead of a warning. Both are initialised
    # here so that a warning printed before any 'patching file' line cannot
    # hit an unbound local.
    pf = None
    printed_file = False
    args = []
    cwd = repo.root
    if cwd:
        args.append('-d %s' % util.shellquote(cwd))
    fp = util.popen('%s %s -p%d < %s' % (patcher, ' '.join(args), strip,
                                       util.shellquote(patchname)))
    try:
        for line in util.iterfile(fp):
            line = line.rstrip()
            ui.note(line + '\n')
            if line.startswith('patching file '):
                pf = util.parsepatchoutput(line)
                printed_file = False
                files.add(pf)
            elif 'with fuzz' in line:
                fuzz = True
                if not printed_file and pf is not None:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
            elif 'saving rejects to file' in line:
                ui.warn(line + '\n')
            elif 'FAILED' in line:
                if not printed_file and pf is not None:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
    finally:
        if files:
            scmutil.marktouched(repo, files, similarity)
    code = fp.close()
    if code:
        raise PatchError(_("patch command failed: %s") %
                         util.explainexit(code)[0])
    return fuzz
2129 2130
def patchbackend(ui, backend, patchobj, strip, prefix, files=None,
                 eolmode='strict'):
    """Apply 'patchobj' through 'backend' and report whether fuzz occurred.

    'patchobj' is first passed to open(); if that raises TypeError it is
    used directly as the patch file object. The value returned by
    backend.close() is merged into 'files'. An 'eolmode' of None is read
    from the patch.eol configuration.

    Raises error.Abort for an unsupported 'eolmode' and PatchError when the
    patch does not apply.
    """
    if files is None:
        files = set()
    if eolmode is None:
        eolmode = ui.config('patch', 'eol')
    lowered = eolmode.lower()
    if lowered not in eolmodes:
        raise error.Abort(_('unsupported line endings type: %s') % eolmode)
    eolmode = lowered

    store = filestore()
    try:
        fp = open(patchobj, 'rb')
    except TypeError:
        # open() rejected it as a path, so use the object itself
        fp = patchobj
    try:
        ret = applydiff(ui, fp, backend, store, strip=strip, prefix=prefix,
                        eolmode=eolmode)
    finally:
        # only close what was opened here
        if fp != patchobj:
            fp.close()
        files.update(backend.close())
        store.close()
    if ret < 0:
        raise PatchError(_('patch failed to apply'))
    return ret > 0
2156 2157
def internalpatch(ui, repo, patchobj, strip, prefix='', files=None,
                  eolmode='strict', similarity=0):
    """apply <patchobj> to the working directory with the builtin patch.
    returns whether patch was applied with fuzz factor."""
    wdbackend = workingbackend(ui, repo, similarity)
    fuzz = patchbackend(ui, wdbackend, patchobj, strip, prefix, files,
                        eolmode)
    return fuzz
2163 2164
def patchrepo(ui, repo, ctx, store, patchobj, strip, prefix, files=None,
              eolmode='strict'):
    """apply <patchobj> through a repobackend built from ctx and store.
    returns the result of patchbackend()."""
    rbackend = repobackend(ui, repo, ctx, store)
    fuzz = patchbackend(ui, rbackend, patchobj, strip, prefix, files,
                        eolmode)
    return fuzz
2168 2169
def patch(ui, repo, patchname, strip=1, prefix='', files=None, eolmode='strict',
          similarity=0):
    """Apply <patchname> to the working directory.

    'eolmode' specifies how end of lines should be handled. It can be:
    - 'strict': inputs are read in binary mode, EOLs are preserved
    - 'crlf': EOLs are ignored when patching and reset to CRLF
    - 'lf': EOLs are ignored when patching and reset to LF
    - None: get it from user settings, default to 'strict'
    'eolmode' is ignored when using an external patcher program.

    The external program named by the ui.patch setting is used when that
    setting is non-empty; otherwise the builtin patcher is used.

    Returns whether patch was applied with fuzz factor.
    """
    external = ui.config('ui', 'patch')
    if files is None:
        files = set()
    if not external:
        return internalpatch(ui, repo, patchname, strip, prefix, files,
                             eolmode, similarity)
    return _externalpatch(ui, repo, external, patchname, strip,
                          files, similarity)
2190 2191
def changedfiles(ui, repo, patchpath, strip=1, prefix=''):
    """Return the set of paths touched by the patch stored at 'patchpath'.

    The destination path of every file event is collected, plus the old
    path for renames. Raises error.Abort on an unknown parser state.
    """
    backend = fsbackend(ui, repo.root)
    prefix = _canonprefix(repo, prefix)

    def pstrip(path):
        return pathtransform(path, strip - 1, prefix)[1]

    with open(patchpath, 'rb') as fp:
        changed = set()
        for state, values in iterhunks(fp):
            if state in ('hunk', 'git'):
                # these events carry no new file names
                continue
            if state != 'file':
                raise error.Abort(_('unsupported parser state: %s') % state)
            afile, bfile, first_hunk, gp = values
            if not gp:
                gp = makepatchmeta(backend, afile, bfile, first_hunk, strip,
                                   prefix)
            else:
                gp.path = pstrip(gp.path)
                if gp.oldpath:
                    gp.oldpath = pstrip(gp.oldpath)
            changed.add(gp.path)
            if gp.op == 'RENAME':
                changed.add(gp.oldpath)
        return changed
2213 2214
class GitDiffRequired(Exception):
    """Raised when a change cannot be kept without the git diff format."""
2216 2217
def diffallopts(ui, opts=None, untrusted=False, section='diff'):
    '''return diffopts with all features supported and parsed'''
    features = {'git': True, 'whitespace': True, 'formatchanging': True}
    return difffeatureopts(ui, opts=opts, untrusted=untrusted,
                           section=section, **features)

# alias for diffallopts
diffopts = diffallopts
2223 2224
def difffeatureopts(ui, opts=None, untrusted=False, section='diff', git=False,
                    whitespace=False, formatchanging=False):
    '''return diffopts with only opted-in features parsed

    Features:
    - git: git-style diffs
    - whitespace: whitespace options like ignoreblanklines and ignorews
    - formatchanging: options that will likely break or cause correctness issues
      with most diff parsers

    'opts' is an optional mapping of command line values that take
    precedence over the configuration read from 'section'. 'untrusted' is
    passed through to the config getters. The collected values are returned
    as an mdiff.diffopts object.
    '''
    def get(key, name=None, getter=ui.configbool, forceplain=None):
        # resolve one option: command line first, then the plain-mode
        # override, then the config entry 'name' (or 'key')
        if opts:
            v = opts.get(key)
            # diffopts flags are either None-default (which is passed
            # through unchanged, so we can identify unset values), or
            # some other falsey default (eg --unified, which defaults
            # to an empty string). We only want to override the config
            # entries from hgrc with command line values if they
            # appear to have been set, which is any truthy value,
            # True, or False.
            if v or isinstance(v, bool):
                return v
        if forceplain is not None and ui.plain():
            return forceplain
        return getter(section, name or key, untrusted=untrusted)

    # core options, expected to be understood by every diff parser
    buildopts = {
        'nodates': get('nodates'),
        'showfunc': get('show_function', 'showfunc'),
        'context': get('unified', getter=ui.config),
    }
    buildopts['worddiff'] = ui.configbool('experimental', 'worddiff')

    if git:
        buildopts['git'] = get('git')

        # since this is in the experimental section, we need to call
        # ui.configbool directly
        buildopts['showsimilarity'] = ui.configbool('experimental',
                                                    'extendedheader.similarity')

        # need to inspect the ui object instead of using get() since we want to
        # test for an int
        hconf = ui.config('experimental', 'extendedheader.index')
        if hconf is not None:
            hlen = None
            try:
                # the hash config could be an integer (for length of hash) or a
                # word (e.g. short, full, none)
                hlen = int(hconf)
                if hlen < 0 or hlen > 40:
                    # only a warning: the out-of-range value is still stored
                    msg = _("invalid length for extendedheader.index: '%d'\n")
                    ui.warn(msg % hlen)
            except ValueError:
                # default value
                if hconf == 'short' or hconf == '':
                    hlen = 12
                elif hconf == 'full':
                    hlen = 40
                elif hconf != 'none':
                    msg = _("invalid value for extendedheader.index: '%s'\n")
                    ui.warn(msg % hconf)
            finally:
                # stored on every path; hlen stays None for 'none' and for
                # unrecognized words
                buildopts['index'] = hlen

    if whitespace:
        buildopts['ignorews'] = get('ignore_all_space', 'ignorews')
        buildopts['ignorewsamount'] = get('ignore_space_change',
                                          'ignorewsamount')
        buildopts['ignoreblanklines'] = get('ignore_blank_lines',
                                            'ignoreblanklines')
        buildopts['ignorewseol'] = get('ignore_space_at_eol', 'ignorewseol')
    if formatchanging:
        buildopts['text'] = opts and opts.get('text')
        binary = None if opts is None else opts.get('binary')
        # an explicit 'binary' value wins over the nobinary config entry
        buildopts['nobinary'] = (not binary if binary is not None
            else get('nobinary', forceplain=False))
        buildopts['noprefix'] = get('noprefix', forceplain=False)

    return mdiff.diffopts(**pycompat.strkwargs(buildopts))
2305 2306
def diff(repo, node1=None, node2=None, match=None, changes=None,
         opts=None, losedatafn=None, prefix='', relroot='', copy=None,
         hunksfilterfn=None):
    '''yields diff of changes to files between two nodes, or node and
    working directory.

    if node1 is None, use first dirstate parent instead.
    if node2 is None, compare node1 with working directory.

    losedatafn(**kwarg) is a callable run when opts.upgrade=True and
    every time some change cannot be represented with the current
    patch format. Return False to upgrade to git patch format, True to
    accept the loss or raise an exception to abort the diff. It is
    called with the name of current file being diffed as 'fn'. If set
    to None, patches will always be upgraded to git format when
    necessary.

    prefix is a filename prefix that is prepended to all filenames on
    display (used for subrepos).

    relroot, if not empty, must be normalized with a trailing /. Any match
    patterns that fall outside it will be ignored.

    copy, if not empty, should contain mappings {dst@y: src@x} of copy
    information.

    hunksfilterfn, if not None, should be a function taking a filectx and
    hunks generator that may yield filtered hunks.

    For each file the header block is yielded first (when there is hunk
    text or more than one header line), followed by the hunk text.
    '''
    for fctx1, fctx2, hdr, hunks in diffhunks(
            repo, node1=node1, node2=node2,
            match=match, changes=changes, opts=opts,
            losedatafn=losedatafn, prefix=prefix, relroot=relroot, copy=copy,
    ):
        if hunksfilterfn is not None:
            # If the file has been removed, fctx2 is None; but this should
            # not occur here since we catch removed files early in
            # cmdutil.getloglinerangerevs() for 'hg log -L'.
            assert fctx2 is not None, \
                'fctx2 unexpectly None in diff hunks filtering'
            hunks = hunksfilterfn(fctx2, hunks)
        # flatten all hunk lines in one pass rather than summing lists
        text = ''.join(l for hrange, hlines in hunks for l in hlines)
        if hdr and (text or len(hdr) > 1):
            yield '\n'.join(hdr) + '\n'
        if text:
            yield text
2352 2353
def diffhunks(repo, node1=None, node2=None, match=None, changes=None,
              opts=None, losedatafn=None, prefix='', relroot='', copy=None):
    """Return an iterable of (`fctx1`, `fctx2`, `header`, `hunks`) tuples
    describing the changes to files, where `header` is a list of diff
    headers and `hunks` is an iterable of (`hunkrange`, `hunklines`) tuples.

    The result is an empty list when nothing changed, a fully buffered list
    when a plain diff was generated under opts.upgrade, and the trydiff()
    generator otherwise.

    See diff() for the meaning of parameters.
    """

    if opts is None:
        opts = mdiff.defaultopts

    if not node1 and not node2:
        node1 = repo.dirstate.p1()

    def lrugetfilectx():
        # small cache of filelogs; 'order' tracks usage so that the least
        # recently used entry is evicted first
        cache = {}
        order = collections.deque()
        def getfilectx(f, ctx):
            fctx = ctx.filectx(f, filelog=cache.get(f))
            if f not in cache:
                if len(cache) > 20:
                    del cache[order.popleft()]
                cache[f] = fctx.filelog()
            else:
                order.remove(f)
            order.append(f)
            return fctx
        return getfilectx
    getfilectx = lrugetfilectx()

    ctx1 = repo[node1]
    ctx2 = repo[node2]

    relfiltered = False
    if relroot != '' and match.always():
        # as a special case, create a new matcher with just the relroot
        pats = [relroot]
        match = scmutil.match(ctx2, pats, default='path')
        relfiltered = True

    if not changes:
        changes = repo.status(ctx1, ctx2, match=match)
    modified, added, removed = changes[:3]

    if not modified and not added and not removed:
        return []

    if repo.ui.debugflag:
        hexfunc = hex
    else:
        hexfunc = short
    revs = [hexfunc(node) for node in [ctx1.node(), ctx2.node()] if node]

    if copy is None:
        copy = {}
        if opts.git or opts.upgrade:
            copy = copies.pathcopies(ctx1, ctx2, match=match)

    if relroot is not None:
        if not relfiltered:
            # XXX this would ideally be done in the matcher, but that is
            # generally meant to 'or' patterns, not 'and' them. In this case we
            # need to 'and' all the patterns from the matcher with relroot.
            def filterrel(l):
                return [f for f in l if f.startswith(relroot)]
            modified = filterrel(modified)
            added = filterrel(added)
            removed = filterrel(removed)
            relfiltered = True
        # filter out copies where either side isn't inside the relative root
        copy = dict(((dst, src) for (dst, src) in copy.iteritems()
                     if dst.startswith(relroot)
                     and src.startswith(relroot)))

    modifiedset = set(modified)
    addedset = set(added)
    removedset = set(removed)
    for f in modified:
        if f not in ctx1:
            # Fix up added, since merged-in additions appear as
            # modifications during merges
            modifiedset.remove(f)
            addedset.add(f)
    for f in removed:
        if f not in ctx1:
            # Merged-in additions that are then removed are reported as removed.
            # They are not in ctx1, so We don't want to show them in the diff.
            removedset.remove(f)
    modified = sorted(modifiedset)
    added = sorted(addedset)
    removed = sorted(removedset)
    # iterate over a snapshot: entries are deleted inside the loop, which is
    # an error when items() is a live view of the dict
    for dst, src in list(copy.items()):
        if src not in ctx1:
            # Files merged in during a merge and then copied/renamed are
            # reported as copies. We want to show them in the diff as additions.
            del copy[dst]

    def difffn(opts, losedata):
        return trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
                       copy, getfilectx, opts, losedata, prefix, relroot)
    if opts.upgrade and not opts.git:
        try:
            def losedata(fn):
                if not losedatafn or not losedatafn(fn=fn):
                    raise GitDiffRequired
            # Buffer the whole output until we are sure it can be generated
            return list(difffn(opts.copy(git=False), losedata))
        except GitDiffRequired:
            return difffn(opts.copy(git=True), None)
    else:
        return difffn(opts, None)
2465 2466
def difflabel(func, *args, **kw):
    '''yields 2-tuples of (output, label) based on the output of func()

    func(*args, **kw) must produce chunks of diff text. When an 'opts'
    keyword is given and its worddiff attribute is set, matching
    deleted/inserted lines are additionally passed through _inlinediff().
    '''
    inlinecolor = False
    if kw.get(r'opts'):
        inlinecolor = kw[r'opts'].worddiff
    # prefix -> label tables, for header lines and for hunk lines
    headprefixes = [('diff', 'diff.diffline'),
                    ('copy', 'diff.extended'),
                    ('rename', 'diff.extended'),
                    ('old', 'diff.extended'),
                    ('new', 'diff.extended'),
                    ('deleted', 'diff.extended'),
                    ('index', 'diff.extended'),
                    ('similarity', 'diff.extended'),
                    ('---', 'diff.file_a'),
                    ('+++', 'diff.file_b')]
    textprefixes = [('@', 'diff.hunk'),
                    ('-', 'diff.deleted'),
                    ('+', 'diff.inserted')]
    # 'head' is kept across chunks: True while inside a file header
    head = False
    for chunk in func(*args, **kw):
        lines = chunk.split('\n')
        matches = {}
        if inlinecolor:
            matches = _findmatches(lines)
        for i, line in enumerate(lines):
            # re-emit the newline removed by split()
            if i != 0:
                yield ('\n', '')
            if head:
                # a hunk marker ends the header
                if line.startswith('@'):
                    head = False
            else:
                # anything that is not a hunk line starts a header
                if line and line[0] not in ' +-@\\':
                    head = True
            stripline = line
            diffline = False
            if not head and line and line[0] in '+-':
                # highlight tabs and trailing whitespace, but only in
                # changed lines
                stripline = line.rstrip()
                diffline = True

            prefixes = textprefixes
            if head:
                prefixes = headprefixes
            for prefix, label in prefixes:
                if stripline.startswith(prefix):
                    if diffline:
                        if i in matches:
                            # word-level highlighting against the paired line
                            for t, l in _inlinediff(lines[i].rstrip(),
                                                    lines[matches[i]].rstrip(),
                                                    label):
                                yield (t, l)
                        else:
                            # runs of tabs get their own label
                            for token in tabsplitter.findall(stripline):
                                if '\t' == token[0]:
                                    yield (token, 'diff.tab')
                                else:
                                    yield (token, label)
                    else:
                        yield (stripline, label)
                    break
            else:
                # no prefix matched: emit the line unlabeled
                yield (line, '')
            if line != stripline:
                yield (line[len(stripline):], 'diff.trailingwhitespace')
2531 2532
2532 2533 def _findmatches(slist):
2533 2534 '''Look for insertion matches to deletion and returns a dict of
2534 2535 correspondences.
2535 2536 '''
2536 2537 lastmatch = 0
2537 2538 matches = {}
2538 2539 for i, line in enumerate(slist):
2539 2540 if line == '':
2540 2541 continue
2541 2542 if line[0] == '-':
2542 2543 lastmatch = max(lastmatch, i)
2543 2544 newgroup = False
2544 2545 for j, newline in enumerate(slist[lastmatch + 1:]):
2545 2546 if newline == '':
2546 2547 continue
2547 2548 if newline[0] == '-' and newgroup: # too far, no match
2548 2549 break
2549 2550 if newline[0] == '+': # potential match
2550 2551 newgroup = True
2551 2552 sim = difflib.SequenceMatcher(None, line, newline).ratio()
2552 2553 if sim > 0.7:
2553 2554 lastmatch = lastmatch + 1 + j
2554 2555 matches[i] = lastmatch
2555 2556 matches[lastmatch] = i
2556 2557 break
2557 2558 return matches
2558 2559
def _inlinediff(s1, s2, operation):
    '''Perform string diff to highlight specific changes.

    s1 is the line being rendered and s2 the line it was paired with;
    'operation' is 'diff.deleted' or 'diff.inserted'. Returns a list of
    (text, label) tuples covering s1, where changed words carry the label
    operation + '.highlight' and a lone tab carries 'diff.tab'.

    Raises error.ProgrammingError when s1 does not start with the marker
    that belongs to 'operation'.
    '''
    # ndiff prefixes to drop: parts that belong to the other line, and hints
    operation_skip = '+?' if operation == 'diff.deleted' else '-?'
    if operation == 'diff.deleted':
        # after the swap s2 is always the deleted line, s1 the inserted one
        s2, s1 = s1, s2

    buff = []
    # we never want to highlight the leading +-
    if operation == 'diff.deleted' and s2.startswith('-'):
        label = operation
        token = '-'
        s2 = s2[1:]
        s1 = s1[1:]
    elif operation == 'diff.inserted' and s1.startswith('+'):
        label = operation
        token = '+'
        s2 = s2[1:]
        s1 = s1[1:]
    else:
        raise error.ProgrammingError("Case not expected, operation = %s" %
                                     operation)

    # split on non-word bytes only; bytes >= 0x80 count as word characters,
    # so a multibyte character is never broken up
    s = difflib.ndiff(_nonwordre.split(s2), _nonwordre.split(s1))
    for part in s:
        # len(part) == 2 is an empty token produced by the split
        if part[0] in operation_skip or len(part) == 2:
            continue
        l = operation + '.highlight'
        if part[0] in ' ':
            l = operation
        if part[2:] == '\t':
            l = 'diff.tab'
        if l == label: # contiguous token with same label
            token += part[2:]
            continue
        else:
            buff.append((token, label))
            label = l
            token = part[2:]
    buff.append((token, label))

    return buff
2600 2601
def diffui(*args, **kw):
    '''like diff(), but yields 2-tuples of (output, label) for ui.write()'''
    labeled = difflabel(diff, *args, **kw)
    return labeled
2604 2605
2605 2606 def _filepairs(modified, added, removed, copy, opts):
2606 2607 '''generates tuples (f1, f2, copyop), where f1 is the name of the file
2607 2608 before and f2 is the the name after. For added files, f1 will be None,
2608 2609 and for removed files, f2 will be None. copyop may be set to None, 'copy'
2609 2610 or 'rename' (the latter two only if opts.git is set).'''
2610 2611 gone = set()
2611 2612
2612 2613 copyto = dict([(v, k) for k, v in copy.items()])
2613 2614
2614 2615 addedset, removedset = set(added), set(removed)
2615 2616
2616 2617 for f in sorted(modified + added + removed):
2617 2618 copyop = None
2618 2619 f1, f2 = f, f
2619 2620 if f in addedset:
2620 2621 f1 = None
2621 2622 if f in copy:
2622 2623 if opts.git:
2623 2624 f1 = copy[f]
2624 2625 if f1 in removedset and f1 not in gone:
2625 2626 copyop = 'rename'
2626 2627 gone.add(f1)
2627 2628 else:
2628 2629 copyop = 'copy'
2629 2630 elif f in removedset:
2630 2631 f2 = None
2631 2632 if opts.git:
2632 2633 # have we already reported a copy above?
2633 2634 if (f in copyto and copyto[f] in addedset
2634 2635 and copy[copyto[f]] == f):
2635 2636 continue
2636 2637 yield f1, f2, copyop
2637 2638
def trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
            copy, getfilectx, opts, losedatafn, prefix, relroot):
    '''given input data, generate a diff and yield it in blocks

    If generating a diff would lose data like flags or binary data and
    losedatafn is not None, it will be called.

    relroot is removed and prefix is added to every path in the diff output.

    If relroot is not empty, this function expects every path in modified,
    added, removed and copy to start with it.

    Each yielded block is a (fctx1, fctx2, header, hunks) tuple; fctx1 is
    None for added files and fctx2 is None for removed files.'''

    def gitindex(text):
        # hash of the content prefixed with 'blob <length>\0'
        if not text:
            text = ""
        l = len(text)
        s = hashlib.sha1('blob %d\0' % l)
        s.update(text)
        return s.hexdigest()

    if opts.noprefix:
        aprefix = bprefix = ''
    else:
        aprefix = 'a/'
        bprefix = 'b/'

    def diffline(f, revs):
        revinfo = ' '.join(["-r %s" % rev for rev in revs])
        return 'diff %s %s' % (revinfo, f)

    def isempty(fctx):
        return fctx is None or fctx.size() == 0

    date1 = util.datestr(ctx1.date())
    date2 = util.datestr(ctx2.date())

    gitmode = {'l': '120000', 'x': '100755', '': '100644'}

    if relroot != '' and (repo.ui.configbool('devel', 'all-warnings')
                          or repo.ui.configbool('devel', 'check-relroot')):
        # developer check: every path must live under relroot
        for f in modified + added + removed + list(copy) + list(copy.values()):
            if f is not None and not f.startswith(relroot):
                raise AssertionError(
                    "file %s doesn't start with relroot %s" % (f, relroot))

    for f1, f2, copyop in _filepairs(modified, added, removed, copy, opts):
        content1 = None
        content2 = None
        fctx1 = None
        fctx2 = None
        flag1 = None
        flag2 = None
        if f1:
            fctx1 = getfilectx(f1, ctx1)
            if opts.git or losedatafn:
                flag1 = ctx1.flags(f1)
        if f2:
            fctx2 = getfilectx(f2, ctx2)
            if opts.git or losedatafn:
                flag2 = ctx2.flags(f2)
        # if binary is True, output "summary" or "base85", but not "text diff"
        binary = not opts.text and any(f.isbinary()
                                      for f in [fctx1, fctx2] if f is not None)

        if losedatafn and not opts.git:
            if (binary or
                # copy/rename
                f2 in copy or
                # empty file creation
                (not f1 and isempty(fctx2)) or
                # empty file deletion
                (isempty(fctx1) and not f2) or
                # create with flags
                (not f1 and flag2) or
                # change flags
                (f1 and f2 and flag1 != flag2)):
                losedatafn(f2 or f1)

        # display paths: relroot stripped, prefix prepended
        path1 = f1 or f2
        path2 = f2 or f1
        path1 = posixpath.join(prefix, path1[len(relroot):])
        path2 = posixpath.join(prefix, path2[len(relroot):])
        header = []
        if opts.git:
            header.append('diff --git %s%s %s%s' %
                          (aprefix, path1, bprefix, path2))
            if not f1: # added
                header.append('new file mode %s' % gitmode[flag2])
            elif not f2: # removed
                header.append('deleted file mode %s' % gitmode[flag1])
            else:  # modified/copied/renamed
                mode1, mode2 = gitmode[flag1], gitmode[flag2]
                if mode1 != mode2:
                    header.append('old mode %s' % mode1)
                    header.append('new mode %s' % mode2)
                if copyop is not None:
                    if opts.showsimilarity:
                        # score the file contexts fetched above; path1 and
                        # path2 are display names, not repository paths
                        sim = similar.score(fctx1, fctx2) * 100
                        header.append('similarity index %d%%' % sim)
                    header.append('%s from %s' % (copyop, path1))
                    header.append('%s to %s' % (copyop, path2))
        elif revs and not repo.ui.quiet:
            header.append(diffline(path1, revs))

        #  fctx.is  | diffopts                | what to   | is fctx.data()
        #  binary() | text nobinary git index | output?   | outputted?
        # ------------------------------------|----------------------------
        #  yes      | no   no       no  *     | summary   | no
        #  yes      | no   no       yes *     | base85    | yes
        #  yes      | no   yes      no  *     | summary   | no
        #  yes      | no   yes      yes 0     | summary   | no
        #  yes      | no   yes      yes >0    | summary   | semi [1]
        #  yes      | yes  *        *   *     | text diff | yes
        #  no       | *    *        *   *     | text diff | yes
        # [1]: hash(fctx.data()) is outputted. so fctx.data() cannot be faked
        if binary and (not opts.git or (opts.git and opts.nobinary and not
                                        opts.index)):
            # fast path: no binary content will be displayed, content1 and
            # content2 are only used for equivalent test. cmp() could have a
            # fast path.
            if fctx1 is not None:
                content1 = b'\0'
            if fctx2 is not None:
                if fctx1 is not None and not fctx1.cmp(fctx2):
                    content2 = b'\0' # not different
                else:
                    content2 = b'\0\0'
        else:
            # normal path: load contents
            if fctx1 is not None:
                content1 = fctx1.data()
            if fctx2 is not None:
                content2 = fctx2.data()

        if binary and opts.git and not opts.nobinary:
            text = mdiff.b85diff(content1, content2)
            if text:
                header.append('index %s..%s' %
                              (gitindex(content1), gitindex(content2)))
            # one-element tuple holding a single (range, lines) pair
            hunks = (None, [text]),
        else:
            if opts.git and opts.index > 0:
                flag = flag1
                if flag is None:
                    flag = flag2
                header.append('index %s..%s %s' %
                              (gitindex(content1)[0:opts.index],
                               gitindex(content2)[0:opts.index],
                               gitmode[flag]))

            uheaders, hunks = mdiff.unidiff(content1, date1,
                                            content2, date2,
                                            path1, path2, opts=opts)
            header.extend(uheaders)
        yield fctx1, fctx2, header, hunks
2793 2794
def diffstatsum(stats):
    '''aggregate per-file diffstat entries into overall figures

    stats is an iterable of (filename, adds, removes, isbinary) tuples.
    Returns a 5-tuple of: the widest filename (in display columns), the
    largest adds + removes of any single file, the sum of all adds, the
    sum of all removes, and a value that is true if any entry was binary.
    '''
    widest = biggest = inserted = deleted = 0
    anybinary = False
    for name, added, removed, isbin in stats:
        # measure display columns rather than bytes so alignment holds
        widest = max(widest, encoding.colwidth(name))
        biggest = max(biggest, added + removed)
        inserted += added
        deleted += removed
        anybinary = anybinary or isbin

    return widest, biggest, inserted, deleted, anybinary
2804 2805
def diffstatdata(lines):
    '''collect per-file change counts from the lines of a diff

    lines is an iterable of diff lines. Returns a list of
    (filename, adds, removes, isbinary) tuples in order of appearance.
    An entry is only recorded once a filename has been seen on a
    "diff --git a/..." or "diff -r ..." line.
    '''
    # raw bytes literal, like the other patterns in this module, so that
    # "\s" reaches the regex engine instead of being an invalid string
    # escape
    diffre = re.compile(br'^diff .*-r [a-z0-9]+\s(.*)$')

    results = []
    filename, adds, removes, isbinary = None, 0, 0, False

    def addresult():
        # flush the counters of the file currently being scanned, if any
        if filename:
            results.append((filename, adds, removes, isbinary))

    # inheader is used to track if a line is in the
    # header portion of the diff. This helps properly account
    # for lines that start with '--' or '++'
    inheader = False

    for line in lines:
        if line.startswith('diff'):
            addresult()
            # starting a new file diff
            # set numbers to 0 and reset inheader
            inheader = True
            adds, removes, isbinary = 0, 0, False
            if line.startswith('diff --git a/'):
                filename = gitre.search(line).group(2)
            elif line.startswith('diff -r'):
                # format: "diff -r ... -r ... filename"
                filename = diffre.search(line).group(1)
        elif line.startswith('@@'):
            # first hunk marker: everything after it is diff content
            inheader = False
        elif line.startswith('+') and not inheader:
            adds += 1
        elif line.startswith('-') and not inheader:
            removes += 1
        elif line.startswith(('GIT binary patch', 'Binary file')):
            isbinary = True
    # the last file has no following 'diff' line to flush it
    addresult()
    return results
2843 2844
def diffstat(lines, width=80):
    '''format a diffstat summary for the given diff lines

    lines is passed to diffstatdata(); width is the total number of
    columns the output should aim for. Returns a single string holding
    one row per file followed by a totals line, or an empty string when
    there is nothing to report.
    '''
    stats = diffstatdata(lines)
    maxname, maxtotal, totaladds, totalremoves, hasbinary = diffstatsum(stats)

    countwidth = len(str(maxtotal))
    if hasbinary:
        # the count column must be able to hold the 'Bin' marker
        countwidth = max(countwidth, 3)
    # never let the histogram shrink below 10 columns
    graphwidth = max(width - countwidth - maxname - 6, 10)

    def scale(i):
        if maxtotal > graphwidth:
            # If diffstat runs out of room it doesn't print anything,
            # which isn't very useful, so always print at least one + or -
            # if there were at least some changes.
            return max(i * graphwidth // maxtotal, int(bool(i)))
        return i

    output = []
    for filename, adds, removes, isbinary in stats:
        count = 'Bin' if isbinary else '%d' % (adds + removes)
        # pad by display columns so the '|' separators line up
        padding = ' ' * (maxname - encoding.colwidth(filename))
        output.append(' %s%s | %*s %s%s\n' %
                      (filename, padding, countwidth, count,
                       '+' * scale(adds), '-' * scale(removes)))

    if stats:
        summary = _(' %d files changed, %d insertions(+), '
                    '%d deletions(-)\n')
        output.append(summary % (len(stats), totaladds, totalremoves))

    return ''.join(output)
2881 2882
def diffstatui(*args, **kw):
    '''labelled variant of diffstat() for colorized output

    Takes the same arguments as diffstat() and yields (output, label)
    2-tuples suitable for ui.write(). The run of '+' in a row is labelled
    'diffstat.inserted', the run of '-' is labelled 'diffstat.deleted',
    and everything else gets an empty label.
    '''
    # histogram pieces in the order they appear at the end of a row
    pieces = (
        (br'\++', 'diffstat.inserted'),
        (br'-+', 'diffstat.deleted'),
    )

    for row in diffstat(*args, **kw).splitlines():
        if not row or row[-1] not in '+-':
            # no histogram on this row (e.g. binary file or totals line)
            yield (row, '')
        else:
            prefix, histogram = row.rsplit(' ', 1)
            yield (prefix + ' ', '')
            for pattern, label in pieces:
                found = re.search(pattern, histogram)
                if found:
                    yield (found.group(0), label)
        # splitlines() dropped the line ending; emit it unlabelled
        yield ('\n', '')
@@ -1,372 +1,392 b''
1 1 Setup
2 2
3 3 $ cat <<EOF >> $HGRCPATH
4 4 > [ui]
5 5 > color = yes
6 6 > formatted = always
7 7 > paginate = never
8 8 > [color]
9 9 > mode = ansi
10 10 > EOF
11 11 $ hg init repo
12 12 $ cd repo
13 13 $ cat > a <<EOF
14 14 > c
15 15 > c
16 16 > a
17 17 > a
18 18 > b
19 19 > a
20 20 > a
21 21 > c
22 22 > c
23 23 > EOF
24 24 $ hg ci -Am adda
25 25 adding a
26 26 $ cat > a <<EOF
27 27 > c
28 28 > c
29 29 > a
30 30 > a
31 31 > dd
32 32 > a
33 33 > a
34 34 > c
35 35 > c
36 36 > EOF
37 37
38 38 default context
39 39
40 40 $ hg diff --nodates
41 41 \x1b[0;1mdiff -r cf9f4ba66af2 a\x1b[0m (esc)
42 42 \x1b[0;31;1m--- a/a\x1b[0m (esc)
43 43 \x1b[0;32;1m+++ b/a\x1b[0m (esc)
44 44 \x1b[0;35m@@ -2,7 +2,7 @@\x1b[0m (esc)
45 45 c
46 46 a
47 47 a
48 48 \x1b[0;31m-b\x1b[0m (esc)
49 49 \x1b[0;32m+dd\x1b[0m (esc)
50 50 a
51 51 a
52 52 c
53 53
54 54 (check that 'ui.color=yes' match '--color=auto')
55 55
56 56 $ hg diff --nodates --config ui.formatted=no
57 57 diff -r cf9f4ba66af2 a
58 58 --- a/a
59 59 +++ b/a
60 60 @@ -2,7 +2,7 @@
61 61 c
62 62 a
63 63 a
64 64 -b
65 65 +dd
66 66 a
67 67 a
68 68 c
69 69
70 70 (check that 'ui.color=no' disable color)
71 71
72 72 $ hg diff --nodates --config ui.formatted=yes --config ui.color=no
73 73 diff -r cf9f4ba66af2 a
74 74 --- a/a
75 75 +++ b/a
76 76 @@ -2,7 +2,7 @@
77 77 c
78 78 a
79 79 a
80 80 -b
81 81 +dd
82 82 a
83 83 a
84 84 c
85 85
86 86 (check that 'ui.color=always' force color)
87 87
88 88 $ hg diff --nodates --config ui.formatted=no --config ui.color=always
89 89 \x1b[0;1mdiff -r cf9f4ba66af2 a\x1b[0m (esc)
90 90 \x1b[0;31;1m--- a/a\x1b[0m (esc)
91 91 \x1b[0;32;1m+++ b/a\x1b[0m (esc)
92 92 \x1b[0;35m@@ -2,7 +2,7 @@\x1b[0m (esc)
93 93 c
94 94 a
95 95 a
96 96 \x1b[0;31m-b\x1b[0m (esc)
97 97 \x1b[0;32m+dd\x1b[0m (esc)
98 98 a
99 99 a
100 100 c
101 101
102 102 --unified=2
103 103
104 104 $ hg diff --nodates -U 2
105 105 \x1b[0;1mdiff -r cf9f4ba66af2 a\x1b[0m (esc)
106 106 \x1b[0;31;1m--- a/a\x1b[0m (esc)
107 107 \x1b[0;32;1m+++ b/a\x1b[0m (esc)
108 108 \x1b[0;35m@@ -3,5 +3,5 @@\x1b[0m (esc)
109 109 a
110 110 a
111 111 \x1b[0;31m-b\x1b[0m (esc)
112 112 \x1b[0;32m+dd\x1b[0m (esc)
113 113 a
114 114 a
115 115
116 116 diffstat
117 117
118 118 $ hg diff --stat
119 119 a | 2 \x1b[0;32m+\x1b[0m\x1b[0;31m-\x1b[0m (esc)
120 120 1 files changed, 1 insertions(+), 1 deletions(-)
121 121 $ cat <<EOF >> $HGRCPATH
122 122 > [extensions]
123 123 > record =
124 124 > [ui]
125 125 > interactive = true
126 126 > [diff]
127 127 > git = True
128 128 > EOF
129 129
130 130 #if execbit
131 131
132 132 record
133 133
134 134 $ chmod +x a
135 135 $ hg record -m moda a <<EOF
136 136 > y
137 137 > y
138 138 > EOF
139 139 \x1b[0;1mdiff --git a/a b/a\x1b[0m (esc)
140 140 \x1b[0;36;1mold mode 100644\x1b[0m (esc)
141 141 \x1b[0;36;1mnew mode 100755\x1b[0m (esc)
142 142 1 hunks, 1 lines changed
143 143 \x1b[0;33mexamine changes to 'a'? [Ynesfdaq?]\x1b[0m y (esc)
144 144
145 145 \x1b[0;35m@@ -2,7 +2,7 @@ c\x1b[0m (esc)
146 146 c
147 147 a
148 148 a
149 149 \x1b[0;31m-b\x1b[0m (esc)
150 150 \x1b[0;32m+dd\x1b[0m (esc)
151 151 a
152 152 a
153 153 c
154 154 \x1b[0;33mrecord this change to 'a'? [Ynesfdaq?]\x1b[0m y (esc)
155 155
156 156
157 157 $ echo "[extensions]" >> $HGRCPATH
158 158 $ echo "mq=" >> $HGRCPATH
159 159 $ hg rollback
160 160 repository tip rolled back to revision 0 (undo commit)
161 161 working directory now based on revision 0
162 162
163 163 qrecord
164 164
165 165 $ hg qrecord -m moda patch <<EOF
166 166 > y
167 167 > y
168 168 > EOF
169 169 \x1b[0;1mdiff --git a/a b/a\x1b[0m (esc)
170 170 \x1b[0;36;1mold mode 100644\x1b[0m (esc)
171 171 \x1b[0;36;1mnew mode 100755\x1b[0m (esc)
172 172 1 hunks, 1 lines changed
173 173 \x1b[0;33mexamine changes to 'a'? [Ynesfdaq?]\x1b[0m y (esc)
174 174
175 175 \x1b[0;35m@@ -2,7 +2,7 @@ c\x1b[0m (esc)
176 176 c
177 177 a
178 178 a
179 179 \x1b[0;31m-b\x1b[0m (esc)
180 180 \x1b[0;32m+dd\x1b[0m (esc)
181 181 a
182 182 a
183 183 c
184 184 \x1b[0;33mrecord this change to 'a'? [Ynesfdaq?]\x1b[0m y (esc)
185 185
186 186
187 187 $ hg qpop -a
188 188 popping patch
189 189 patch queue now empty
190 190
191 191 #endif
192 192
193 193 issue3712: test colorization of subrepo diff
194 194
195 195 $ hg init sub
196 196 $ echo b > sub/b
197 197 $ hg -R sub commit -Am 'create sub'
198 198 adding b
199 199 $ echo 'sub = sub' > .hgsub
200 200 $ hg add .hgsub
201 201 $ hg commit -m 'add subrepo sub'
202 202 $ echo aa >> a
203 203 $ echo bb >> sub/b
204 204
205 205 $ hg diff -S
206 206 \x1b[0;1mdiff --git a/a b/a\x1b[0m (esc)
207 207 \x1b[0;31;1m--- a/a\x1b[0m (esc)
208 208 \x1b[0;32;1m+++ b/a\x1b[0m (esc)
209 209 \x1b[0;35m@@ -7,3 +7,4 @@\x1b[0m (esc)
210 210 a
211 211 c
212 212 c
213 213 \x1b[0;32m+aa\x1b[0m (esc)
214 214 \x1b[0;1mdiff --git a/sub/b b/sub/b\x1b[0m (esc)
215 215 \x1b[0;31;1m--- a/sub/b\x1b[0m (esc)
216 216 \x1b[0;32;1m+++ b/sub/b\x1b[0m (esc)
217 217 \x1b[0;35m@@ -1,1 +1,2 @@\x1b[0m (esc)
218 218 b
219 219 \x1b[0;32m+bb\x1b[0m (esc)
220 220
221 221 test tabs
222 222
223 223 $ cat >> a <<EOF
224 224 > one tab
225 225 > two tabs
226 226 > end tab
227 227 > mid tab
228 228 > all tabs
229 229 > EOF
230 230 $ hg diff --nodates
231 231 \x1b[0;1mdiff --git a/a b/a\x1b[0m (esc)
232 232 \x1b[0;31;1m--- a/a\x1b[0m (esc)
233 233 \x1b[0;32;1m+++ b/a\x1b[0m (esc)
234 234 \x1b[0;35m@@ -7,3 +7,9 @@\x1b[0m (esc)
235 235 a
236 236 c
237 237 c
238 238 \x1b[0;32m+aa\x1b[0m (esc)
239 239 \x1b[0;32m+\x1b[0m \x1b[0;32mone tab\x1b[0m (esc)
240 240 \x1b[0;32m+\x1b[0m \x1b[0;32mtwo tabs\x1b[0m (esc)
241 241 \x1b[0;32m+end tab\x1b[0m\x1b[0;1;41m \x1b[0m (esc)
242 242 \x1b[0;32m+mid\x1b[0m \x1b[0;32mtab\x1b[0m (esc)
243 243 \x1b[0;32m+\x1b[0m \x1b[0;32mall\x1b[0m \x1b[0;32mtabs\x1b[0m\x1b[0;1;41m \x1b[0m (esc)
244 244 $ echo "[color]" >> $HGRCPATH
245 245 $ echo "diff.tab = bold magenta" >> $HGRCPATH
246 246 $ hg diff --nodates
247 247 \x1b[0;1mdiff --git a/a b/a\x1b[0m (esc)
248 248 \x1b[0;31;1m--- a/a\x1b[0m (esc)
249 249 \x1b[0;32;1m+++ b/a\x1b[0m (esc)
250 250 \x1b[0;35m@@ -7,3 +7,9 @@\x1b[0m (esc)
251 251 a
252 252 c
253 253 c
254 254 \x1b[0;32m+aa\x1b[0m (esc)
255 255 \x1b[0;32m+\x1b[0m\x1b[0;1;35m \x1b[0m\x1b[0;32mone tab\x1b[0m (esc)
256 256 \x1b[0;32m+\x1b[0m\x1b[0;1;35m \x1b[0m\x1b[0;32mtwo tabs\x1b[0m (esc)
257 257 \x1b[0;32m+end tab\x1b[0m\x1b[0;1;41m \x1b[0m (esc)
258 258 \x1b[0;32m+mid\x1b[0m\x1b[0;1;35m \x1b[0m\x1b[0;32mtab\x1b[0m (esc)
259 259 \x1b[0;32m+\x1b[0m\x1b[0;1;35m \x1b[0m\x1b[0;32mall\x1b[0m\x1b[0;1;35m \x1b[0m\x1b[0;32mtabs\x1b[0m\x1b[0;1;41m \x1b[0m (esc)
260 260
261 261 $ cd ..
262 262
263 263 test inline color diff
264 264
265 265 $ hg init inline
266 266 $ cd inline
267 267 $ cat > file1 << EOF
268 268 > this is the first line
269 269 > this is the second line
270 270 > third line starts with space
271 271 > + starts with a plus sign
272 272 > this one with one tab
273 273 > now with full two tabs
274 274 > now tabs everywhere, much fun
275 275 >
276 276 > this line won't change
277 277 >
278 278 > two lines are going to
279 279 > be changed into three!
280 280 >
281 281 > three of those lines will
282 282 > collapse onto one
283 283 > (to see if it works)
284 284 > EOF
285 285 $ hg add file1
286 286 $ hg ci -m 'commit'
287 287
288 288 $ cat > file1 << EOF
289 289 > that is the first paragraph
290 290 > this is the second line
291 291 > third line starts with space
292 292 > - starts with a minus sign
293 293 > this one with two tab
294 294 > now with full three tabs
295 295 > now there are tabs everywhere, much fun
296 296 >
297 297 > this line won't change
298 298 >
299 299 > two lines are going to
300 300 > (entirely magically,
301 301 > assuming this works)
302 302 > be changed into four!
303 303 >
304 304 > three of those lines have
305 305 > collapsed onto one
306 306 > EOF
307 307 $ hg diff --config experimental.worddiff=False --color=debug
308 308 [diff.diffline|diff --git a/file1 b/file1]
309 309 [diff.file_a|--- a/file1]
310 310 [diff.file_b|+++ b/file1]
311 311 [diff.hunk|@@ -1,16 +1,17 @@]
312 312 [diff.deleted|-this is the first line]
313 313 [diff.deleted|-this is the second line]
314 314 [diff.deleted|- third line starts with space]
315 315 [diff.deleted|-+ starts with a plus sign]
316 316 [diff.deleted|-][diff.tab| ][diff.deleted|this one with one tab]
317 317 [diff.deleted|-][diff.tab| ][diff.deleted|now with full two tabs]
318 318 [diff.deleted|-][diff.tab| ][diff.deleted|now tabs][diff.tab| ][diff.deleted|everywhere, much fun]
319 319 [diff.inserted|+that is the first paragraph]
320 320 [diff.inserted|+ this is the second line]
321 321 [diff.inserted|+third line starts with space]
322 322 [diff.inserted|+- starts with a minus sign]
323 323 [diff.inserted|+][diff.tab| ][diff.inserted|this one with two tab]
324 324 [diff.inserted|+][diff.tab| ][diff.inserted|now with full three tabs]
325 325 [diff.inserted|+][diff.tab| ][diff.inserted|now there are tabs][diff.tab| ][diff.inserted|everywhere, much fun]
326 326
327 327 this line won't change
328 328
329 329 two lines are going to
330 330 [diff.deleted|-be changed into three!]
331 331 [diff.inserted|+(entirely magically,]
332 332 [diff.inserted|+ assuming this works)]
333 333 [diff.inserted|+be changed into four!]
334 334
335 335 [diff.deleted|-three of those lines will]
336 336 [diff.deleted|-collapse onto one]
337 337 [diff.deleted|-(to see if it works)]
338 338 [diff.inserted|+three of those lines have]
339 339 [diff.inserted|+collapsed onto one]
340 340 $ hg diff --config experimental.worddiff=True --color=debug
341 341 [diff.diffline|diff --git a/file1 b/file1]
342 342 [diff.file_a|--- a/file1]
343 343 [diff.file_b|+++ b/file1]
344 344 [diff.hunk|@@ -1,16 +1,17 @@]
345 345 [diff.deleted|-this is the ][diff.deleted.highlight|first][diff.deleted| line]
346 346 [diff.deleted|-this is the second line]
347 347 [diff.deleted|-][diff.deleted.highlight| ][diff.deleted|third line starts with space]
348 348 [diff.deleted|-][diff.deleted.highlight|+][diff.deleted| starts with a ][diff.deleted.highlight|plus][diff.deleted| sign]
349 349 [diff.deleted|-][diff.tab| ][diff.deleted|this one with ][diff.deleted.highlight|one][diff.deleted| tab]
350 350 [diff.deleted|-][diff.tab| ][diff.deleted|now with full ][diff.deleted.highlight|two][diff.deleted| tabs]
351 351 [diff.deleted|-][diff.tab| ][diff.deleted|now tabs][diff.tab| ][diff.deleted|everywhere, much fun]
352 352 [diff.inserted|+that is the first paragraph]
353 353 [diff.inserted|+][diff.inserted.highlight| ][diff.inserted|this is the ][diff.inserted.highlight|second][diff.inserted| line]
354 354 [diff.inserted|+third line starts with space]
355 355 [diff.inserted|+][diff.inserted.highlight|-][diff.inserted| starts with a ][diff.inserted.highlight|minus][diff.inserted| sign]
356 356 [diff.inserted|+][diff.tab| ][diff.inserted|this one with ][diff.inserted.highlight|two][diff.inserted| tab]
357 357 [diff.inserted|+][diff.tab| ][diff.inserted|now with full ][diff.inserted.highlight|three][diff.inserted| tabs]
358 358 [diff.inserted|+][diff.tab| ][diff.inserted|now][diff.inserted.highlight| there are][diff.inserted| tabs][diff.tab| ][diff.inserted|everywhere, much fun]
359 359
360 360 this line won't change
361 361
362 362 two lines are going to
363 363 [diff.deleted|-be changed into ][diff.deleted.highlight|three][diff.deleted|!]
364 364 [diff.inserted|+(entirely magically,]
365 365 [diff.inserted|+ assuming this works)]
366 366 [diff.inserted|+be changed into ][diff.inserted.highlight|four][diff.inserted|!]
367 367
368 368 [diff.deleted|-three of those lines ][diff.deleted.highlight|will]
369 369 [diff.deleted|-][diff.deleted.highlight|collapse][diff.deleted| onto one]
370 370 [diff.deleted|-(to see if it works)]
371 371 [diff.inserted|+three of those lines ][diff.inserted.highlight|have]
372 372 [diff.inserted|+][diff.inserted.highlight|collapsed][diff.inserted| onto one]
373
374 multibyte character shouldn't be broken up in word diff:
375
376 $ $PYTHON <<'EOF'
377 > with open("utf8", "wb") as f:
378 > f.write(b"blah \xe3\x82\xa2 blah\n")
379 > EOF
380 $ hg ci -Am 'add utf8 char' utf8
381 $ $PYTHON <<'EOF'
382 > with open("utf8", "wb") as f:
383 > f.write(b"blah \xe3\x82\xa4 blah\n")
384 > EOF
385 $ hg ci -m 'slightly change utf8 char' utf8
386 $ hg diff --config experimental.worddiff=True --color=debug -c.
387 [diff.diffline|diff --git a/utf8 b/utf8]
388 [diff.file_a|--- a/utf8]
389 [diff.file_b|+++ b/utf8]
390 [diff.hunk|@@ -1,1 +1,1 @@]
391 [diff.deleted|-blah ][diff.deleted.highlight|\xe3\x82\xa2][diff.deleted| blah] (esc)
392 [diff.inserted|+blah ][diff.inserted.highlight|\xe3\x82\xa4][diff.inserted| blah] (esc)
General Comments 0
You need to be logged in to leave comments. Login now