##// END OF EJS Templates
patch: check length of git index header only if integer is specified...
Yuya Nishihara -
r30819:89772662 default
parent child Browse files
Show More
@@ -1,2653 +1,2653 b''
1 1 # patch.py - patch file parsing routines
2 2 #
3 3 # Copyright 2006 Brendan Cully <brendan@kublai.com>
4 4 # Copyright 2007 Chris Mason <chris.mason@oracle.com>
5 5 #
6 6 # This software may be used and distributed according to the terms of the
7 7 # GNU General Public License version 2 or any later version.
8 8
9 9 from __future__ import absolute_import
10 10
11 11 import collections
12 12 import copy
13 13 import email
14 14 import errno
15 15 import hashlib
16 16 import os
17 17 import posixpath
18 18 import re
19 19 import shutil
20 20 import tempfile
21 21 import zlib
22 22
23 23 from .i18n import _
24 24 from .node import (
25 25 hex,
26 26 short,
27 27 )
28 28 from . import (
29 29 base85,
30 30 copies,
31 31 diffhelpers,
32 32 encoding,
33 33 error,
34 34 mail,
35 35 mdiff,
36 36 pathutil,
37 37 scmutil,
38 38 similar,
39 39 util,
40 40 )
# Local alias for util.stringio; used below to wrap strings as file objects.
stringio = util.stringio

# Matches the first line of a git-style diff; the two groups capture the
# paths following "a/" and "b/".
gitre = re.compile('diff --git a/(.*) b/(.*)')
# Matches either a run of tab characters or a run of non-tab characters.
tabsplitter = re.compile(r'(\t+|[^\t]+)')
45 45
class PatchError(Exception):
    """Error raised by this module when a patch cannot be applied."""
48 48
49 49
50 50 # public functions
51 51
def split(stream):
    '''return an iterator of individual patches from a stream

    The first lines of ``stream`` are inspected to choose a splitting
    strategy (hg export, mbox, MIME message, plain headers, or a single
    plain patch). Each yielded item is a stringio object holding one patch.
    '''
    def isheader(line, inheader):
        # Decide whether ``line`` looks like an RFC-822 style "Name: value"
        # header line (or the continuation of one).
        if inheader and line[0] in (' ', '\t'):
            # continuation
            return True
        if line[0] in (' ', '-', '+'):
            # diff line - don't check for header pattern in there
            return False
        l = line.split(': ', 1)
        # a header needs a "name: value" shape with no space in the name
        return len(l) == 2 and ' ' not in l[0]

    def chunk(lines):
        # Wrap the accumulated lines into a single file-like object.
        return stringio(''.join(lines))

    def hgsplit(stream, cur):
        # Split on "# HG changeset patch" markers. A marker only starts a
        # new chunk once a blank line has ended the current header.
        inheader = True

        for line in stream:
            if not line.strip():
                inheader = False
            if not inheader and line.startswith('# HG changeset patch'):
                yield chunk(cur)
                cur = []
                inheader = True

            cur.append(line)

        if cur:
            yield chunk(cur)

    def mboxsplit(stream, cur):
        # Split on mbox "From " separator lines. Each message, minus its
        # first line (cur[1:]), is split again recursively.
        for line in stream:
            if line.startswith('From '):
                for c in split(chunk(cur[1:])):
                    yield c
                cur = []

            cur.append(line)

        if cur:
            for c in split(chunk(cur[1:])):
                yield c

    def mimesplit(stream, cur):
        # Read the rest of the stream, parse it as an email message and
        # yield either the whole message or each acceptable text part.
        def msgfp(m):
            # Flatten message ``m`` into a fresh stringio rewound to 0.
            fp = stringio()
            g = email.Generator.Generator(fp, mangle_from_=False)
            g.flatten(m)
            fp.seek(0)
            return fp

        for line in stream:
            cur.append(line)
        c = chunk(cur)

        m = email.Parser.Parser().parse(c)
        if not m.is_multipart():
            yield msgfp(m)
        else:
            ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
            for part in m.walk():
                ct = part.get_content_type()
                if ct not in ok_types:
                    continue
                yield msgfp(part)

    def headersplit(stream, cur):
        # Split by hand: a new chunk starts whenever a header line is seen
        # while not already inside a header block.
        inheader = False

        for line in stream:
            if not inheader and isheader(line, inheader):
                yield chunk(cur)
                cur = []
                inheader = True
            if inheader and not isheader(line, inheader):
                inheader = False

            cur.append(line)

        if cur:
            yield chunk(cur)

    def remainder(cur):
        # Everything read so far is a single patch.
        yield chunk(cur)

    class fiter(object):
        # Adapter giving an object that only has readline() an iterator
        # interface (``next`` method); iteration stops on an empty read.
        def __init__(self, fp):
            self.fp = fp

        def __iter__(self):
            return self

        def next(self):
            l = self.fp.readline()
            if not l:
                raise StopIteration
            return l

    inheader = False
    cur = []

    mimeheaders = ['content-type']

    if not util.safehasattr(stream, 'next'):
        # http responses, for example, have readline but not next
        stream = fiter(stream)

    # Sniff lines until one identifies the format; the chosen splitter gets
    # both the lines consumed so far (cur) and the rest of the stream.
    for line in stream:
        cur.append(line)
        if line.startswith('# HG changeset patch'):
            return hgsplit(stream, cur)
        elif line.startswith('From '):
            return mboxsplit(stream, cur)
        elif isheader(line, inheader):
            inheader = True
            if line.split(':', 1)[0].lower() in mimeheaders:
                # let email parser handle this
                return mimesplit(stream, cur)
        elif line.startswith('--- ') and inheader:
            # No evil headers seen by diff start, split by hand
            return headersplit(stream, cur)
        # Not enough info, keep reading

    # if we are here, we have a very plain patch
    return remainder(cur)
178 178
## Some facility for extensible patch parsing:
# Each entry pairs a "# <header> " name found in an hg patch header with the
# key under which extract() stores its value: ("header to match", "data key")
patchheadermap = [
    ('Date', 'date'),
    ('Branch', 'branch'),
    ('Node ID', 'nodeid'),
]
185 185
def extract(ui, fileobj):
    '''extract patch from data read from fileobj.

    patch can be a normal patch or contained in an email message.

    return a dictionary. Standard keys are:
      - filename,
      - message,
      - user,
      - date,
      - branch,
      - nodeid,
      - p1,
      - p2.
    Any item can be missing from the dictionary. If filename is missing,
    fileobj did not contain a patch. Caller must unlink filename when done.'''

    # attempt to detect the start of a patch
    # (this heuristic is borrowed from quilt)
    diffre = re.compile(r'^(?:Index:[ \t]|diff[ \t]|RCS file: |'
                        r'retrieving revision [0-9]+(\.[0-9]+)*$|'
                        r'---[ \t].*?^\+\+\+[ \t]|'
                        r'\*\*\*[ \t].*?^---[ \t])', re.MULTILINE|re.DOTALL)

    data = {}
    # The patch payload is copied to a temporary file whose name is handed
    # back to the caller under data['filename'].
    fd, tmpname = tempfile.mkstemp(prefix='hg-patch-')
    tmpfp = os.fdopen(fd, 'w')
    try:
        msg = email.Parser.Parser().parse(fileobj)

        subject = msg['Subject'] and mail.headdecode(msg['Subject'])
        data['user'] = msg['From'] and mail.headdecode(msg['From'])
        if not subject and not data['user']:
            # Not an email, restore parsed headers if any
            subject = '\n'.join(': '.join(h) for h in msg.items()) + '\n'

        # should try to parse msg['Date']
        parents = []

        if subject:
            # strip a leading "[PATCH ...]" tag and unfold continuation lines
            if subject.startswith('[PATCH'):
                pend = subject.find(']')
                if pend >= 0:
                    subject = subject[pend + 1:].lstrip()
            subject = re.sub(r'\n[ \t]+', ' ', subject)
            ui.debug('Subject: %s\n' % subject)
        if data['user']:
            ui.debug('From: %s\n' % data['user'])
        diffs_seen = 0
        ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
        message = ''
        for part in msg.walk():
            content_type = part.get_content_type()
            ui.debug('Content-Type: %s\n' % content_type)
            if content_type not in ok_types:
                continue
            payload = part.get_payload(decode=True)
            m = diffre.search(payload)
            if m:
                # State for scanning the text that precedes the diff:
                # hgpatch: a "# HG changeset patch" marker has been seen
                # hgpatchheader: currently inside the "# ..." header lines
                # ignoretext: a "---" line was seen; drop the text after it
                hgpatch = False
                hgpatchheader = False
                ignoretext = False

                ui.debug('found patch at byte %d\n' % m.start(0))
                diffs_seen += 1
                cfp = stringio()
                for line in payload[:m.start(0)].splitlines():
                    if line.startswith('# HG changeset patch') and not hgpatch:
                        ui.debug('patch generated by hg export\n')
                        hgpatch = True
                        hgpatchheader = True
                        # drop earlier commit message content
                        cfp.seek(0)
                        cfp.truncate()
                        subject = None
                    elif hgpatchheader:
                        if line.startswith('# User '):
                            data['user'] = line[7:]
                            ui.debug('From: %s\n' % data['user'])
                        elif line.startswith("# Parent "):
                            parents.append(line[9:].lstrip())
                        elif line.startswith("# "):
                            # other known headers are stored under the key
                            # listed in patchheadermap
                            for header, key in patchheadermap:
                                prefix = '# %s ' % header
                                if line.startswith(prefix):
                                    data[key] = line[len(prefix):]
                        else:
                            # first non-"# " line ends the hg header
                            hgpatchheader = False
                    elif line == '---':
                        ignoretext = True
                    if not hgpatchheader and not ignoretext:
                        cfp.write(line)
                        cfp.write('\n')
                message = cfp.getvalue()
                if tmpfp:
                    tmpfp.write(payload)
                    # make sure the stored payload ends with a newline
                    if not payload.endswith('\n'):
                        tmpfp.write('\n')
            elif not diffs_seen and message and content_type == 'text/plain':
                # text part seen before any diff: extend the message
                message += '\n' + payload
    except: # re-raises
        # clean up the temporary file before propagating the error
        tmpfp.close()
        os.unlink(tmpname)
        raise

    if subject and not message.startswith(subject):
        message = '%s\n%s' % (subject, message)
    data['message'] = message
    tmpfp.close()
    # the first "# Parent" line becomes p1, the second (if any) p2
    if parents:
        data['p1'] = parents.pop(0)
        if parents:
            data['p2'] = parents.pop(0)

    if diffs_seen:
        data['filename'] = tmpname
    else:
        # no patch was found, so nothing is handed back to the caller
        os.unlink(tmpname)
    return data
305 305
class patchmeta(object):
    """Metadata describing one patched file.

    'op' names the operation performed: one of ADD, DELETE, RENAME, MODIFY
    or COPY. 'path' is the path of the patched file. 'oldpath' holds the
    origin file for COPY and RENAME and is None otherwise. When the patch
    changes the file mode, 'mode' is an (islink, isexec) pair whose items
    are truthy for a symlink and for an executable file respectively;
    otherwise 'mode' is None. 'binary' is a flag that starts out False.
    """
    def __init__(self, path):
        self.path = path
        self.op = 'MODIFY'
        self.oldpath = None
        self.mode = None
        self.binary = False

    def setmode(self, mode):
        """Record the symlink and exec bits of the integer file mode."""
        self.mode = (mode & 0o20000, mode & 0o100)

    def copy(self):
        """Return a new patchmeta carrying the same attribute values."""
        clone = patchmeta(self.path)
        for attr in ('oldpath', 'mode', 'op', 'binary'):
            setattr(clone, attr, getattr(self, attr))
        return clone

    def _ispatchinga(self, afile):
        # '/dev/null' as the source side only matches a file addition
        if afile != '/dev/null':
            source = self.oldpath or self.path
            return afile == 'a/' + source
        return self.op == 'ADD'

    def _ispatchingb(self, bfile):
        # '/dev/null' as the destination side only matches a deletion
        if bfile != '/dev/null':
            return bfile == 'b/' + self.path
        return self.op == 'DELETE'

    def ispatching(self, afile, bfile):
        """Tell whether the afile/bfile header pair refers to this file."""
        if not self._ispatchinga(afile):
            return False
        return self._ispatchingb(bfile)

    def __repr__(self):
        return "<patchmeta %s %r>" % (self.op, self.path)
351 351
def readgitpatch(lr):
    """Collect git-style metadata from the patch lines yielded by lr.

    Returns a list of patchmeta objects, one per "diff --git" header that
    matches gitre, filled in from the extended header lines following it.
    """

    gitpatches = []
    # patchmeta currently being filled in, or None outside a git header
    current = None
    for rawline in lr:
        text = rawline.rstrip(' \r\n')
        if text.startswith('diff --git a/'):
            found = gitre.match(text)
            if found:
                if current:
                    gitpatches.append(current)
                current = patchmeta(found.group(2))
            continue
        if not current:
            continue

        if text.startswith('--- '):
            # start of the actual diff: the header for this file is done
            gitpatches.append(current)
            current = None
        elif text.startswith('rename from '):
            current.op = 'RENAME'
            current.oldpath = text[12:]
        elif text.startswith('rename to '):
            current.path = text[10:]
        elif text.startswith('copy from '):
            current.op = 'COPY'
            current.oldpath = text[10:]
        elif text.startswith('copy to '):
            current.path = text[8:]
        elif text.startswith('deleted file'):
            current.op = 'DELETE'
        elif text.startswith('new file mode '):
            current.op = 'ADD'
            # the mode is the trailing six octal digits
            current.setmode(int(text[-6:], 8))
        elif text.startswith('new mode '):
            current.setmode(int(text[-6:], 8))
        elif text.startswith('GIT binary patch'):
            current.binary = True

    if current:
        gitpatches.append(current)

    return gitpatches
395 395
class linereader(object):
    """Wrap a file object so that lines can be pushed back onto the input."""

    def __init__(self, fp):
        self.fp = fp
        # pushed-back lines, served before reading from fp again
        self.buf = []

    def push(self, line):
        """Queue line for a later readline(); a None line is ignored."""
        if line is None:
            return
        self.buf.append(line)

    def readline(self):
        """Return the oldest pushed-back line, else the next line of fp."""
        if not self.buf:
            return self.fp.readline()
        return self.buf.pop(0)

    def __iter__(self):
        # iterate until readline() returns the empty string
        return iter(self.readline, '')
415 415
class abstractbackend(object):
    """Interface of the objects that patched files are read from and
    written to. Only writerej() has a default (do-nothing) behaviour.
    """

    def __init__(self, ui):
        self.ui = ui

    def getfile(self, fname):
        """Return the data and flags of target file fname as a
        (data, (islink, isexec)) tuple. Data is None when the file is
        missing/deleted.
        """
        raise NotImplementedError()

    def setfile(self, fname, data, mode, copysource):
        """Write data to target file fname and set its mode, given as an
        (islink, isexec) tuple. A data of None means the file content
        should be left unchanged. copysource is the original file name
        when the file is modified after being copied.
        """
        raise NotImplementedError()

    def unlink(self, fname):
        """Unlink target file."""
        raise NotImplementedError()

    def writerej(self, fname, failed, total, lines):
        """Write rejected lines for fname. failed is the number of hunks
        which failed to apply and total the total number of hunks for this
        file.
        """
        return None

    def exists(self, fname):
        raise NotImplementedError()
447 447
class fsbackend(abstractbackend):
    """Backend operating on files below basedir through scmutil.opener."""

    def __init__(self, ui, basedir):
        super(fsbackend, self).__init__(ui)
        self.opener = scmutil.opener(basedir)

    def _join(self, f):
        base = self.opener.base
        return os.path.join(base, f)

    def getfile(self, fname):
        """Return (data, (islink, isexec)) for fname, or (None, None) when
        reading it fails with ENOENT. For a symlink, data is its target.
        """
        opener = self.opener
        if opener.islink(fname):
            target = opener.readlink(fname)
            return (target, (True, False))

        executable = False
        try:
            st = opener.lstat(fname)
        except OSError as err:
            # a missing file simply keeps executable False
            if err.errno != errno.ENOENT:
                raise
        else:
            executable = (st.st_mode & 0o100) != 0

        try:
            content = opener.read(fname)
        except IOError as err:
            if err.errno != errno.ENOENT:
                raise
            return None, None
        return (content, (False, executable))

    def setfile(self, fname, data, mode, copysource):
        """Write data to fname, or only update its flags if data is None."""
        islink, isexec = mode
        if data is None:
            self.opener.setflags(fname, islink, isexec)
        elif islink:
            self.opener.symlink(data, fname)
        else:
            self.opener.write(fname, data)
            if isexec:
                self.opener.setflags(fname, False, True)

    def unlink(self, fname):
        self.opener.unlinkpath(fname, ignoremissing=True)

    def writerej(self, fname, failed, total, lines):
        """Warn about the failed hunks and save lines to "<fname>.rej"."""
        rejname = fname + ".rej"
        warning = _("%d out of %d hunks FAILED -- saving rejects to file %s\n")
        self.ui.warn(warning % (failed, total, rejname))
        rejfp = self.opener(rejname, 'w')
        rejfp.writelines(lines)
        rejfp.close()

    def exists(self, fname):
        return self.opener.lexists(fname)
499 499
class workingbackend(fsbackend):
    """Filesystem backend rooted at repo.root that also records which
    files were changed, removed or copied, for use by close().
    """

    def __init__(self, ui, repo, similarity):
        super(workingbackend, self).__init__(ui, repo.root)
        self.repo = repo
        self.similarity = similarity
        self.changed = set()
        self.removed = set()
        # (source, destination) pairs, in the order they were written
        self.copied = []

    def _checkknown(self, fname):
        # refuse to touch a file that exists but has dirstate status '?'
        untracked = self.repo.dirstate[fname] == '?'
        if untracked and self.exists(fname):
            raise PatchError(_('cannot patch %s: file is not tracked') % fname)

    def setfile(self, fname, data, mode, copysource):
        self._checkknown(fname)
        super(workingbackend, self).setfile(fname, data, mode, copysource)
        if copysource is not None:
            self.copied.append((copysource, fname))
        self.changed.add(fname)

    def unlink(self, fname):
        self._checkknown(fname)
        super(workingbackend, self).unlink(fname)
        self.removed.add(fname)
        self.changed.add(fname)

    def close(self):
        """Record copies and removals in the working context, mark the
        touched files and return the sorted list of changed files.
        """
        wctx = self.repo[None]
        touched = set(self.changed)
        for source, dest in self.copied:
            scmutil.dirstatecopy(self.ui, self.repo, wctx, source, dest)
        if self.removed:
            wctx.forget(sorted(self.removed))
            # File was deleted and no longer belongs to the
            # dirstate, it was probably marked added then
            # deleted, and should not be considered by
            # marktouched().
            dirstate = self.repo.dirstate
            for gone in self.removed:
                if gone not in dirstate:
                    touched.discard(gone)
        if touched:
            scmutil.marktouched(self.repo, touched, self.similarity)
        return sorted(self.changed)
543 543
class filestore(object):
    """Store of (data, mode, copied) entries keyed by file name.

    Entries are kept in memory while the accumulated data size stays
    within maxsize (or always, when maxsize is negative); later entries
    are written to files in a temporary directory instead.
    """

    def __init__(self, maxsize=None):
        # maxsize defaults to 4 * 2**20 when not given
        self.maxsize = 4*(2**20) if maxsize is None else maxsize
        self.size = 0
        self.data = {}
        # state for entries spilled to a temporary directory
        self.opener = None
        self.files = {}
        self.created = 0

    def setfile(self, fname, data, mode, copied=None):
        """Remember data, mode and copied for fname."""
        fits = self.maxsize < 0 or (len(data) + self.size) <= self.maxsize
        if fits:
            self.data[fname] = (data, mode, copied)
            self.size += len(data)
            return

        if self.opener is None:
            tmproot = tempfile.mkdtemp(prefix='hg-patch-')
            self.opener = scmutil.opener(tmproot)
        # Avoid filename issues with these simple names
        diskname = str(self.created)
        self.opener.write(diskname, data)
        self.created += 1
        self.files[fname] = (diskname, mode, copied)

    def getfile(self, fname):
        """Return (data, mode, copied) for fname, or (None, None, None)
        when nothing was stored under that name.
        """
        try:
            return self.data[fname]
        except KeyError:
            pass
        if not self.opener or fname not in self.files:
            return None, None, None
        diskname, mode, copied = self.files[fname]
        return self.opener.read(diskname), mode, copied

    def close(self):
        """Remove the temporary directory if one was created."""
        if self.opener:
            shutil.rmtree(self.opener.base)
580 580
class repobackend(abstractbackend):
    """Backend reading files from the context ctx and writing the patched
    results into store instead of the filesystem.
    """

    def __init__(self, ui, repo, ctx, store):
        super(repobackend, self).__init__(ui)
        self.repo = repo
        self.ctx = ctx
        self.store = store
        self.changed = set()
        self.removed = set()
        # maps a destination file name to its copy source
        self.copied = {}

    def _checkknown(self, fname):
        if fname in self.ctx:
            return
        raise PatchError(_('cannot patch %s: file is not tracked') % fname)

    def getfile(self, fname):
        """Return (data, (islink, isexec)) read from ctx, or (None, None)
        when looking fname up raises error.LookupError.
        """
        try:
            fctx = self.ctx[fname]
        except error.LookupError:
            return None, None
        flags = fctx.flags()
        mode = ('l' in flags, 'x' in flags)
        return fctx.data(), mode

    def setfile(self, fname, data, mode, copysource):
        """Store the new state of fname; with data None the content
        currently in ctx is stored.
        """
        if copysource:
            self._checkknown(copysource)
        if data is None:
            data = self.ctx[fname].data()
        self.store.setfile(fname, data, mode, copysource)
        self.changed.add(fname)
        if copysource:
            self.copied[fname] = copysource

    def unlink(self, fname):
        self._checkknown(fname)
        self.removed.add(fname)

    def exists(self, fname):
        return fname in self.ctx

    def close(self):
        """Return the set of file names that were changed or removed."""
        return self.changed | self.removed
622 622
# Unified hunk header: "@@ -start,len +start,len @@", or
# "@@ -start +start @@" where a length is omitted (len is 1).
# Groups: old start, old length or None, new start, new length or None.
# Raw strings keep \d, \+ and \* as regex escapes rather than (invalid)
# string escapes; the compiled patterns are unchanged.
unidesc = re.compile(r'@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@')
# Context-diff range line: "*** start,len ***" or "--- start,len ---",
# with the ",len" part optional. Groups: start, length or None.
contextdesc = re.compile(r'(?:---|\*\*\*) (\d+)(?:,(\d+))? (?:---|\*\*\*)')
# Names of the supported end-of-line handling modes.
eolmodes = ['strict', 'crlf', 'lf', 'auto']
627 627
class patchfile(object):
    # Holds the lines of one target file while hunks are applied to it,
    # collects rejected hunks, and writes the result through the backend.
    def __init__(self, ui, gp, backend, store, eolmode='strict'):
        # gp supplies path, mode, oldpath and op (see patchmeta). The file
        # content is read from backend, or from store when the file is a
        # copy/rename of gp.oldpath.
        self.fname = gp.path
        self.eolmode = eolmode
        self.eol = None
        self.backend = backend
        self.ui = ui
        self.lines = []
        self.exists = False
        self.missing = True
        self.mode = gp.mode
        self.copysource = gp.oldpath
        self.create = gp.op in ('ADD', 'COPY', 'RENAME')
        self.remove = gp.op == 'DELETE'
        if self.copysource is None:
            data, mode = backend.getfile(self.fname)
        else:
            data, mode = store.getfile(self.copysource)[:2]
        if data is not None:
            # for a copy, "exists" refers to the destination file
            self.exists = self.copysource is None or backend.exists(self.fname)
            self.missing = False
            if data:
                self.lines = mdiff.splitnewlines(data)
            if self.mode is None:
                self.mode = mode
            if self.lines:
                # Normalize line endings
                # (the EOL of the first line is remembered in self.eol)
                if self.lines[0].endswith('\r\n'):
                    self.eol = '\r\n'
                elif self.lines[0].endswith('\n'):
                    self.eol = '\n'
                if eolmode != 'strict':
                    nlines = []
                    for l in self.lines:
                        if l.endswith('\r\n'):
                            l = l[:-2] + '\n'
                        nlines.append(l)
                    self.lines = nlines
        else:
            # no existing content: acceptable only if the patch creates it
            if self.create:
                self.missing = False
            if self.mode is None:
                self.mode = (False, False)
        if self.missing:
            self.ui.warn(_("unable to find '%s' for patching\n") % self.fname)
            self.ui.warn(_("(use '--prefix' to apply patch relative to the "
                           "current directory)\n"))

        # self.hash maps line content to the line numbers where it occurs;
        # it is rebuilt in apply() when a hunk does not apply directly.
        self.hash = {}
        self.dirty = 0
        # offset: accumulated line-count change from hunks applied so far
        self.offset = 0
        # skew: distance between where the last fuzzy-matched hunk applied
        # and where it was expected
        self.skew = 0
        self.rej = []
        self.fileprinted = False
        self.printfile(False)
        self.hunks = 0

    def writelines(self, fname, lines, mode):
        # Write lines to fname through the backend, converting '\n' line
        # endings to the EOL selected by self.eolmode when it is not '\n'.
        if self.eolmode == 'auto':
            eol = self.eol
        elif self.eolmode == 'crlf':
            eol = '\r\n'
        else:
            eol = '\n'

        if self.eolmode != 'strict' and eol and eol != '\n':
            rawlines = []
            for l in lines:
                if l and l[-1] == '\n':
                    l = l[:-1] + eol
                rawlines.append(l)
            lines = rawlines

        self.backend.setfile(fname, ''.join(lines), mode, self.copysource)

    def printfile(self, warn):
        # Emit the "patching file" message: as a warning when warn is set,
        # as a note otherwise. Once marked as printed it is not repeated.
        if self.fileprinted:
            return
        if warn or self.ui.verbose:
            self.fileprinted = True
        s = _("patching file %s\n") % self.fname
        if warn:
            self.ui.warn(s)
        else:
            self.ui.note(s)


    def findlines(self, l, linenum):
        # looks through the hash and finds candidate lines.  The
        # result is a list of line numbers sorted based on distance
        # from linenum

        cand = self.hash.get(l, [])
        if len(cand) > 1:
            # resort our list of potentials forward then back.
            cand.sort(key=lambda x: abs(x - linenum))
        return cand

    def write_rej(self):
        # our rejects are a little different from patch(1).  This always
        # creates rejects in the same form as the original patch.  A file
        # header is inserted so that you can run the reject through patch again
        # without having to type the filename.
        if not self.rej:
            return
        base = os.path.basename(self.fname)
        lines = ["--- %s\n+++ %s\n" % (base, base)]
        for x in self.rej:
            for l in x.hunk:
                lines.append(l)
                # a hunk line lacking a final newline gets the marker added
                if l[-1] != '\n':
                    lines.append("\n\ No newline at end of file\n")
        self.backend.writerej(self.fname, len(self.rej), self.hunks, lines)

    def apply(self, h):
        # Apply hunk h to self.lines. Returns 0 when it applied directly,
        # the fuzz length used when it applied after searching, and -1 when
        # it was rejected (the hunk is then appended to self.rej).
        # Raises PatchError if h.complete() is false.
        if not h.complete():
            raise PatchError(_("bad hunk #%d %s (%d %d %d %d)") %
                            (h.number, h.desc, len(h.a), h.lena, len(h.b),
                            h.lenb))

        self.hunks += 1

        if self.missing:
            self.rej.append(h)
            return -1

        if self.exists and self.create:
            if self.copysource:
                self.ui.warn(_("cannot create %s: destination already "
                               "exists\n") % self.fname)
            else:
                self.ui.warn(_("file %s already exists\n") % self.fname)
            self.rej.append(h)
            return -1

        if isinstance(h, binhunk):
            # binary hunk: replace the whole content, or delete the file
            if self.remove:
                self.backend.unlink(self.fname)
            else:
                l = h.new(self.lines)
                self.lines[:] = l
                self.offset += len(l)
                self.dirty = True
            return 0

        # keep the unmodified hunk so that a reject preserves the input
        horig = h
        if (self.eolmode in ('crlf', 'lf')
            or self.eolmode == 'auto' and self.eol):
            # If new eols are going to be normalized, then normalize
            # hunk data before patching. Otherwise, preserve input
            # line-endings.
            h = h.getnormalized()

        # fast case first, no offsets, no fuzz
        old, oldstart, new, newstart = h.fuzzit(0, False)
        oldstart += self.offset
        orig_start = oldstart
        # if there's skew we want to emit the "(offset %d lines)" even
        # when the hunk cleanly applies at start + skew, so skip the
        # fast case code
        # (a testhunk() result of 0 is treated as a match)
        if (self.skew == 0 and
            diffhelpers.testhunk(old, self.lines, oldstart) == 0):
            if self.remove:
                self.backend.unlink(self.fname)
            else:
                self.lines[oldstart:oldstart + len(old)] = new
                self.offset += len(new) - len(old)
                self.dirty = True
            return 0

        # ok, we couldn't match the hunk. Let's look for offsets and fuzz it
        self.hash = {}
        for x, s in enumerate(self.lines):
            self.hash.setdefault(s, []).append(x)

        # try increasing fuzz lengths, up to the patch.fuzz setting
        # (default 2), each time with toponly True and then False
        for fuzzlen in xrange(self.ui.configint("patch", "fuzz", 2) + 1):
            for toponly in [True, False]:
                old, oldstart, new, newstart = h.fuzzit(fuzzlen, toponly)
                oldstart = oldstart + self.offset + self.skew
                oldstart = min(oldstart, len(self.lines))
                if old:
                    # candidates are the places where the hunk's first old
                    # line (minus its leading marker character) occurs
                    cand = self.findlines(old[0][1:], oldstart)
                else:
                    # Only adding lines with no or fuzzed context, just
                    # take the skew in account
                    cand = [oldstart]

                for l in cand:
                    if not old or diffhelpers.testhunk(old, self.lines, l) == 0:
                        self.lines[l : l + len(old)] = new
                        self.offset += len(new) - len(old)
                        self.skew = l - orig_start
                        self.dirty = True
                        offset = l - orig_start - fuzzlen
                        if fuzzlen:
                            msg = _("Hunk #%d succeeded at %d "
                                    "with fuzz %d "
                                    "(offset %d lines).\n")
                            self.printfile(True)
                            self.ui.warn(msg %
                                (h.number, l + 1, fuzzlen, offset))
                        else:
                            msg = _("Hunk #%d succeeded at %d "
                                    "(offset %d lines).\n")
                            self.ui.note(msg % (h.number, l + 1, offset))
                        return fuzzlen
        # no candidate position matched at any fuzz level
        self.printfile(True)
        self.ui.warn(_("Hunk #%d FAILED at %d\n") % (h.number, orig_start))
        self.rej.append(horig)
        return -1

    def close(self):
        # Write the patched lines if anything changed, save the rejects,
        # and return the number of rejected hunks.
        if self.dirty:
            self.writelines(self.fname, self.lines, self.mode)
        self.write_rej()
        return len(self.rej)
844 844
class header(object):
    """Header of one file's diff.

    'header' is the list of header lines; 'hunks' is a list that starts
    out empty.
    """
    diffgit_re = re.compile('diff --git a/(.*) b/(.*)$')
    diff_re = re.compile('diff -r .* (.*)$')
    allhunks_re = re.compile('(?:index|deleted file) ')
    pretty_re = re.compile('(?:new file|deleted file) ')
    special_re = re.compile('(?:index|deleted|copy|rename) ')
    newfile_re = re.compile('(?:new file)')

    def __init__(self, header):
        self.header = header
        self.hunks = []

    def binary(self):
        """True if any header line starts with 'index '."""
        for line in self.header:
            if line.startswith('index '):
                return True
        return False

    def pretty(self, fp):
        """Write a summarized form of the header to fp.

        Lines are copied until one starting with 'index ', one matching
        pretty_re, or one starting with '---' is reached; that line is
        replaced or followed by a short description and output stops.
        """
        for line in self.header:
            if line.startswith('index '):
                fp.write(_('this modifies a binary file (all or nothing)\n'))
                return
            if self.pretty_re.match(line):
                fp.write(line)
                if self.binary():
                    fp.write(_('this is a binary file\n'))
                return
            if line.startswith('---'):
                nchanged = sum([max(hunk.added, hunk.removed)
                                for hunk in self.hunks])
                fp.write(_('%d hunks, %d lines changed\n') %
                         (len(self.hunks), nchanged))
                return
            fp.write(line)

    def write(self, fp):
        """Write all header lines to fp unchanged."""
        fp.write(''.join(self.header))

    def allhunks(self):
        """True if any header line matches allhunks_re."""
        for line in self.header:
            if self.allhunks_re.match(line):
                return True
        return False

    def files(self):
        """Return the file names found on the first header line.

        For a 'diff --git' line this is a list holding one name when both
        sides are equal and two otherwise; for any other line it is the
        groups tuple of diff_re.
        """
        firstline = self.header[0]
        gitmatch = self.diffgit_re.match(firstline)
        if not gitmatch:
            return self.diff_re.match(firstline).groups()
        fromfile, tofile = gitmatch.groups()
        if fromfile == tofile:
            return [fromfile]
        return [fromfile, tofile]

    def filename(self):
        """Return the last of the names given by files()."""
        return self.files()[-1]

    def __repr__(self):
        names = [repr(f) for f in self.files()]
        return '<header %s>' % (' '.join(names))

    def isnewfile(self):
        """True if any header line matches newfile_re."""
        for line in self.header:
            if self.newfile_re.match(line):
                return True
        return False

    def special(self):
        """Tell whether the file can only be handled at the header level."""
        # Special files are shown only at the header level and not at the hunk
        # level for example a file that has been deleted is a special file.
        # The user cannot change the content of the operation, in the case of
        # the deleted file he has to take the deletion or not take it, he
        # cannot take some of it.
        # Newly added files are special if they are empty, they are not special
        # if they have some content as we want to be able to change it
        nocontent = len(self.header) == 2
        if self.isnewfile() and nocontent:
            return True
        for line in self.header:
            if self.special_re.match(line):
                return True
        return False
916 916
class recordhunk(object):
    """One hunk of a patch together with its surrounding context lines.

    XXX shouldn't we merge this with the other hunk class?
    """
    maxcontext = 3

    def __init__(self, header, fromline, toline, proc, before, hunk, after):
        def trimcontext(number, lines):
            # Trimming the context to maxcontext lines is switched off by
            # the constant False below, so both values pass through as is.
            excess = len(lines) - self.maxcontext
            if False and excess > 0:
                return number + excess, lines[:self.maxcontext]
            return number, lines

        self.header = header
        self.proc = proc
        self.hunk = hunk
        self.fromline, self.before = trimcontext(fromline, before)
        self.toline, self.after = trimcontext(toline, after)
        counts = self.countchanges(self.hunk)
        self.added, self.removed = counts

    def __eq__(self, v):
        # equal when hunk lines, proc, starting line and files all agree
        if not isinstance(v, recordhunk):
            return False
        if not (v.hunk == self.hunk):
            return False
        if not (v.proc == self.proc):
            return False
        if not (self.fromline == v.fromline):
            return False
        return self.header.files() == v.header.files()

    def __hash__(self):
        key = (tuple(self.hunk),
               tuple(self.header.files()),
               self.fromline,
               self.proc)
        return hash(key)

    def countchanges(self, hunk):
        """hunk -> (n+,n-)"""
        added = 0
        removed = 0
        for line in hunk:
            marker = line[0]
            if marker == '+':
                added += 1
            elif marker == '-':
                removed += 1
        return added, removed

    def write(self, fp):
        """Write the "@@ ... @@" range line and all hunk lines to fp."""
        context = len(self.before) + len(self.after)
        # the "no newline" marker is not counted as a context line
        if self.after and self.after[-1] == '\\ No newline at end of file\n':
            context -= 1
        fromlen = context + self.removed
        tolen = context + self.added
        procsuffix = self.proc and (' ' + self.proc)
        rangeline = '@@ -%d,%d +%d,%d @@%s\n' % (
            self.fromline, fromlen, self.toline, tolen, procsuffix)
        fp.write(rangeline)
        fp.write(''.join(self.before + self.hunk + self.after))

    pretty = write

    def filename(self):
        return self.header.filename()

    def __repr__(self):
        return '<hunk %r@%d>' % (self.filename(), self.fromline)
977 977
def filterpatch(ui, headers, operation=None):
    """Interactively filter patch chunks into applied-only chunks

    ui is used for every prompt and for all output.  headers is an
    iterable of parsed file headers; each one is asked whether its file
    should be examined and then, hunk by hunk, whether the change should
    be selected.  operation picks the wording of the per-hunk question
    and must be 'record' (the default when None), 'discard' or 'revert'.

    Returns a pair: a flat list in which every retained header is
    followed by its selected hunks, and an empty dict.  A header is
    retained when it is special() or when at least one hunk was selected
    for it.
    """
    if operation is None:
        operation = 'record'
    # pick the per-hunk question for this operation once, up front; an
    # unknown operation fails here with KeyError
    messages = {
        'multiple': {
            'discard': _("discard change %d/%d to '%s'?"),
            'record': _("record change %d/%d to '%s'?"),
            'revert': _("revert change %d/%d to '%s'?"),
        }[operation],
        'single': {
            'discard': _("discard this change to '%s'?"),
            'record': _("record this change to '%s'?"),
            'revert': _("revert this change to '%s'?"),
        }[operation],
    }

    def prompt(skipfile, skipall, query, chunk):
        """prompt query, and process base inputs

        - y/n for the rest of file
        - y/n for the rest
        - ? (help)
        - q (quit)

        skipfile and skipall are None while no blanket answer was given,
        otherwise the True/False answer to reuse without prompting
        (skipall takes precedence).  chunk is the hunk being asked about,
        or None when the question concerns a whole file, in which case
        editing is refused.

        Return (answer, skipfile, skipall, newpatches): answer is
        True/False, skipfile and skipall are possibly updated, and
        newpatches is None unless the user edited the hunk, in which case
        it is the result of parsing the edited text (answer is then
        False).  Quitting raises error.Abort.
        """
        newpatches = None
        if skipall is not None:
            return skipall, skipfile, skipall, newpatches
        if skipfile is not None:
            return skipfile, skipfile, skipall, newpatches
        while True:
            # the position of each choice below is the index returned by
            # ui.promptchoice() and tested in the if/elif chain
            resps = _('[Ynesfdaq?]'
                      '$$ &Yes, record this change'
                      '$$ &No, skip this change'
                      '$$ &Edit this change manually'
                      '$$ &Skip remaining changes to this file'
                      '$$ Record remaining changes to this &file'
                      '$$ &Done, skip remaining changes and files'
                      '$$ Record &all changes to all remaining files'
                      '$$ &Quit, recording no changes'
                      '$$ &? (display help)')
            r = ui.promptchoice("%s %s" % (query, resps))
            ui.write("\n")
            if r == 8: # ?
                for c, t in ui.extractchoices(resps)[1]:
                    ui.write('%s - %s\n' % (c, encoding.lower(t)))
                continue
            elif r == 0: # yes
                ret = True
            elif r == 1: # no
                ret = False
            elif r == 2: # Edit patch
                if chunk is None:
                    ui.write(_('cannot edit patch for whole file'))
                    ui.write("\n")
                    continue
                if chunk.header.binary():
                    ui.write(_('cannot edit patch for binary file'))
                    ui.write("\n")
                    continue
                # Patch comment based on the Git one (based on comment at end of
                # https://mercurial-scm.org/wiki/RecordExtension)
                phelp = '---' + _("""
To remove '-' lines, make them ' ' lines (context).
To remove '+' lines, delete them.
Lines starting with # will be removed from the patch.

If the patch applies cleanly, the edited hunk will immediately be
added to the record list. If it does not apply cleanly, a rejects
file will be generated: you can use that when you try again. If
all lines of the hunk are removed, then the edit is aborted and
the hunk is left unchanged.
""")
                (patchfd, patchfn) = tempfile.mkstemp(prefix="hg-editor-",
                        suffix=".diff", text=True)
                ncpatchfp = None
                try:
                    # Write the initial patch
                    f = os.fdopen(patchfd, "w")
                    chunk.header.write(f)
                    chunk.write(f)
                    # the help text is appended as '#' comment lines
                    f.write('\n'.join(['# ' + i for i in phelp.splitlines()]))
                    f.close()
                    # Start the editor and wait for it to complete
                    editor = ui.geteditor()
                    # 'ret' temporarily holds the editor's exit code here
                    ret = ui.system("%s \"%s\"" % (editor, patchfn),
                                    environ={'HGUSER': ui.username()})
                    if ret != 0:
                        ui.warn(_("editor exited with exit code %d\n") % ret)
                        # ask again; the finally clause still removes the
                        # temporary file
                        continue
                    # Remove comment lines
                    patchfp = open(patchfn)
                    ncpatchfp = stringio()
                    for line in util.iterfile(patchfp):
                        if not line.startswith('#'):
                            ncpatchfp.write(line)
                    patchfp.close()
                    ncpatchfp.seek(0)
                    newpatches = parsepatch(ncpatchfp)
                finally:
                    os.unlink(patchfn)
                    del ncpatchfp
                # Signal that the chunk shouldn't be applied as-is, but
                # provide the new patch to be used instead.
                ret = False
            elif r == 3: # Skip
                ret = skipfile = False
            elif r == 4: # file (Record remaining)
                ret = skipfile = True
            elif r == 5: # done, skip remaining
                ret = skipall = False
            elif r == 6: # all
                ret = skipall = True
            elif r == 7: # quit
                raise error.Abort(_('user quit'))
            return ret, skipfile, skipall, newpatches

    seen = set()
    applied = {}        # 'filename' -> [] of chunks
    skipfile, skipall = None, None
    # pos ends up one past the last hunk of the current header, so that
    # 'pos - len(h.hunks) + i' is the 1-based number of hunk i overall
    pos, total = 1, sum(len(h.hunks) for h in headers)
    for h in headers:
        pos += len(h.hunks)
        # a per-file answer never carries over to the next file
        skipfile = None
        # line shift to apply to the new-file start of later hunks of this
        # file, accumulated from the hunks that were not selected
        fixoffset = 0
        hdr = ''.join(h.header)
        # a header whose text was already seen is not processed again
        if hdr in seen:
            continue
        seen.add(hdr)
        if skipall is None:
            h.pretty(ui)
        msg = (_('examine changes to %s?') %
               _(' and ').join("'%s'" % f for f in h.files()))
        r, skipfile, skipall, np = prompt(skipfile, skipall, msg, None)
        if not r:
            continue
        applied[h.filename()] = [h]
        if h.allhunks():
            # all hunks are taken without asking about each one
            applied[h.filename()] += h.hunks
            continue
        for i, chunk in enumerate(h.hunks):
            if skipfile is None and skipall is None:
                chunk.pretty(ui)
            if total == 1:
                msg = messages['single'] % chunk.filename()
            else:
                idx = pos - len(h.hunks) + i
                msg = messages['multiple'] % (idx, total, chunk.filename())
            r, skipfile, skipall, newpatches = prompt(skipfile,
                    skipall, msg, chunk)
            if r:
                if fixoffset:
                    # shift a copy so the caller's hunk is left untouched
                    chunk = copy.copy(chunk)
                    chunk.toline += fixoffset
                applied[chunk.filename()].append(chunk)
            elif newpatches is not None:
                # the hunk was edited: take the hunks parsed from the
                # edited text instead of the original one
                for newpatch in newpatches:
                    for newhunk in newpatch.hunks:
                        if fixoffset:
                            newhunk.toline += fixoffset
                        applied[newhunk.filename()].append(newhunk)
            else:
                # hunk rejected: later hunks of this file start this many
                # lines further down in the resulting file
                fixoffset += chunk.removed - chunk.added
    # flatten to [header, hunk, ..., header, hunk, ...]; a header with no
    # selected hunk is dropped unless it is special()
    return (sum([h for h in applied.itervalues()
               if h[0].special() or len(h) > 1], []), {})
class hunk(object):
    """A text hunk read from a unified or a context diff.

    'hunk' holds the hunk in unified form: the range line followed by the
    body lines, each starting with ' ', '-' or '+'.  'a' and 'b' are the
    old and the new side of the hunk.  'starta'/'lena' and
    'startb'/'lenb' are the parsed ranges; they stay None until one of
    the readers has run.
    """
    def __init__(self, desc, num, lr, context):
        """Create a hunk and, when lr is given, read its body.

        desc is the line introducing the hunk and num its number, used in
        error messages.  lr is a line reader offering readline() and
        push(), or None to get an empty hunk that the caller fills in.
        A true context selects the context diff reader, otherwise the
        unified reader is used.
        """
        self.number = num
        self.desc = desc
        self.hunk = [desc]
        self.a = []
        self.b = []
        self.starta = self.lena = None
        self.startb = self.lenb = None
        if lr is not None:
            if context:
                self.read_context_hunk(lr)
            else:
                self.read_unified_hunk(lr)

    def getnormalized(self):
        """Return a copy with line endings normalized to LF."""

        def normalize(lines):
            nlines = []
            for line in lines:
                if line.endswith('\r\n'):
                    line = line[:-2] + '\n'
                nlines.append(line)
            return nlines

        # Dummy object, it is rebuilt manually
        nh = hunk(self.desc, self.number, None, None)
        nh.number = self.number
        nh.desc = self.desc
        # the unified text is shared with the original, not normalized
        nh.hunk = self.hunk
        nh.a = normalize(self.a)
        nh.b = normalize(self.b)
        nh.starta = self.starta
        nh.startb = self.startb
        nh.lena = self.lena
        nh.lenb = self.lenb
        return nh

    def read_unified_hunk(self, lr):
        """Parse the range line in self.desc and read the body from lr.

        Raises PatchError when the range line is not recognized.
        """
        m = unidesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.starta, self.lena, self.startb, self.lenb = m.groups()
        # a missing length means a single line
        if self.lena is None:
            self.lena = 1
        else:
            self.lena = int(self.lena)
        if self.lenb is None:
            self.lenb = 1
        else:
            self.lenb = int(self.lenb)
        self.starta = int(self.starta)
        self.startb = int(self.startb)
        diffhelpers.addlines(lr, self.hunk, self.lena, self.lenb, self.a,
                             self.b)
        # if we hit eof before finishing out the hunk, the last line will
        # be zero length.  Lets try to fix it up.
        while len(self.hunk[-1]) == 0:
            del self.hunk[-1]
            del self.a[-1]
            del self.b[-1]
            self.lena -= 1
            self.lenb -= 1
        self._fixnewline(lr)

    def read_context_hunk(self, lr):
        """Read a context diff hunk from lr and convert it to unified form.

        The old block is read first, then the new block is merged into
        self.hunk; self.desc is finally rewritten as a unified range line.
        Raises PatchError on a range line or a body line that cannot be
        understood.
        """
        self.desc = lr.readline()
        m = contextdesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.starta, aend = m.groups()
        self.starta = int(self.starta)
        if aend is None:
            aend = self.starta
        self.lena = int(aend) - self.starta
        if self.starta:
            self.lena += 1
        for x in xrange(self.lena):
            l = lr.readline()
            if l.startswith('---'):
                # lines addition, old block is empty
                lr.push(l)
                break
            # every body line carries a two character marker
            s = l[2:]
            if l.startswith('- ') or l.startswith('! '):
                u = '-' + s
            elif l.startswith('  '):
                u = ' ' + s
            else:
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.a.append(u)
            self.hunk.append(u)

        l = lr.readline()
        if l.startswith('\\ '):
            # "no newline" marker: drop the last character of the last
            # old line
            s = self.a[-1][:-1]
            self.a[-1] = s
            self.hunk[-1] = s
            l = lr.readline()
        m = contextdesc.match(l)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.startb, bend = m.groups()
        self.startb = int(self.startb)
        if bend is None:
            bend = self.startb
        self.lenb = int(bend) - self.startb
        if self.startb:
            self.lenb += 1
        # position in self.hunk where the next new line gets merged
        hunki = 1
        for x in xrange(self.lenb):
            l = lr.readline()
            if l.startswith('\\ '):
                # XXX: the only way to hit this is with an invalid line range.
                # The no-eol marker is not counted in the line range, but I
                # guess there are diff(1) out there which behave differently.
                s = self.b[-1][:-1]
                self.b[-1] = s
                self.hunk[hunki - 1] = s
                continue
            if not l:
                # line deletions, new block is empty and we hit EOF
                lr.push(l)
                break
            s = l[2:]
            if l.startswith('+ ') or l.startswith('! '):
                u = '+' + s
            elif l.startswith('  '):
                u = ' ' + s
            elif len(self.b) == 0:
                # line deletions, new block is empty
                lr.push(l)
                break
            else:
                # NOTE: the message says "old text" although the new block
                # is being read; the translated string is left unchanged
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.b.append(s)
            # walk self.hunk past removed lines until this line is found
            # or has to be inserted
            while True:
                if hunki >= len(self.hunk):
                    h = ""
                else:
                    h = self.hunk[hunki]
                hunki += 1
                if h == u:
                    break
                elif h.startswith('-'):
                    continue
                else:
                    self.hunk.insert(hunki - 1, u)
                    break

        if not self.a:
            # this happens when lines were only added to the hunk
            for x in self.hunk:
                if x.startswith('-') or x.startswith(' '):
                    self.a.append(x)
        if not self.b:
            # this happens when lines were only deleted from the hunk
            for x in self.hunk:
                if x.startswith('+') or x.startswith(' '):
                    self.b.append(x[1:])
        # @@ -start,len +start,len @@
        self.desc = "@@ -%d,%d +%d,%d @@\n" % (self.starta, self.lena,
                                               self.startb, self.lenb)
        self.hunk[0] = self.desc
        self._fixnewline(lr)

    def _fixnewline(self, lr):
        """Consume a following "no newline" marker line, if there is one.

        Any other line is pushed back onto lr.
        """
        l = lr.readline()
        if l.startswith('\\ '):
            diffhelpers.fix_newline(self.hunk, self.a, self.b)
        else:
            lr.push(l)

    def complete(self):
        """Tell whether both sides hold as many lines as their ranges say."""
        return len(self.a) == self.lena and len(self.b) == self.lenb

    def _fuzzit(self, old, new, fuzz, toponly):
        # this removes context lines from the top and bottom of list 'l'.  It
        # checks the hunk to make sure only context lines are removed, and then
        # returns a new shortened list of lines.
        #
        # Returns (old, new, top) where top is the number of lines removed
        # from the top.
        fuzz = min(fuzz, len(old))
        if fuzz:
            top = 0
            bot = 0
            hlen = len(self.hunk)
            # the hunk starts with the @@ line, so the body is 1..hlen-1
            while top < hlen - 1 and self.hunk[top + 1][0] == ' ':
                top += 1
            if not toponly:
                while bot < hlen - 1 and self.hunk[hlen - bot - 1][0] == ' ':
                    bot += 1

            bot = min(fuzz, bot)
            top = min(fuzz, top)
            return old[top:len(old) - bot], new[top:len(new) - bot], top
        return old, new, 0

    def fuzzit(self, fuzz, toponly):
        """Return (old, oldstart, new, newstart) with context trimmed.

        Up to fuzz context lines are removed from the top and, unless
        toponly is set, from the bottom.  The returned start values are
        the range starts shifted by the lines removed from the top and
        decremented by one for non-empty ranges.
        """
        old, new, top = self._fuzzit(self.a, self.b, fuzz, toponly)
        oldstart = self.starta + top
        newstart = self.startb + top
        # zero length hunk ranges already have their start decremented
        if self.lena and oldstart > 0:
            oldstart -= 1
        if self.lenb and newstart > 0:
            newstart -= 1
        return old, oldstart, new, newstart
1361 1361
class binhunk(object):
    """A binary patch file.

    The hunk is read from a line reader right after the
    'GIT binary patch' line.  'text' is the decoded payload, 'delta'
    tells whether that payload is a delta to apply rather than the full
    content, and 'hunk' keeps every line that was consumed.
    """
    def __init__(self, lr, fname):
        """Read a binary hunk for file fname from line reader lr.

        Raises PatchError when the hunk cannot be read or decoded.
        """
        self.text = None
        self.delta = False
        self.hunk = ['GIT binary patch\n']
        self._fname = fname
        self._read(lr)

    def complete(self):
        """Tell whether a payload was decoded."""
        return self.text is not None

    def new(self, lines):
        """Return the new file content as a one element list.

        lines is the current content; it is only used for delta hunks.
        """
        if self.delta:
            return [applybindelta(self.text, ''.join(lines))]
        return [self.text]

    def _read(self, lr):
        """Parse the size line and the encoded payload from lr.

        Raises PatchError when no size line is found, when the size is
        not a number, when a payload line cannot be decoded, when the
        payload cannot be decompressed or when its length does not match
        the announced size.
        """
        def getline(lr, hunk):
            # every line read is recorded in the hunk
            l = lr.readline()
            hunk.append(l)
            return l.rstrip('\r\n')

        size = 0
        while True:
            line = getline(lr, self.hunk)
            if not line:
                raise PatchError(_('could not extract "%s" binary data')
                                 % self._fname)
            if line.startswith('literal '):
                sizetext = line[8:]
                isdelta = False
            elif line.startswith('delta '):
                sizetext = line[6:]
                isdelta = True
            else:
                continue
            try:
                size = int(sizetext.rstrip())
            except ValueError:
                # a garbled size is a broken patch, not an internal error
                raise PatchError(_('could not extract "%s" binary data')
                                 % self._fname)
            if isdelta:
                self.delta = True
            break
        dec = []
        line = getline(lr, self.hunk)
        while len(line) > 1:
            # the first character encodes how many decoded bytes the line
            # carries: 'A'-'Z' stand for 1-26, other letters count on
            # from 27 starting at 'a'
            l = line[0]
            if l <= 'Z' and l >= 'A':
                l = ord(l) - ord('A') + 1
            else:
                l = ord(l) - ord('a') + 27
            try:
                dec.append(base85.b85decode(line[1:])[:l])
            except ValueError as e:
                raise PatchError(_('could not decode "%s" binary patch: %s')
                                 % (self._fname, str(e)))
            line = getline(lr, self.hunk)
        try:
            text = zlib.decompress(''.join(dec))
        except zlib.error as e:
            # corrupt or truncated data must be reported as a patch error
            raise PatchError(_('could not decode "%s" binary patch: %s')
                             % (self._fname, str(e)))
        if len(text) != size:
            raise PatchError(_('"%s" length is %d bytes, should be %d')
                             % (self._fname, len(text), size))
        self.text = text
1417 1417
def parsefilename(str):
    """Extract the file name from a '--- ' or '+++ ' style header line.

    The four leading characters and the line ending are dropped; the name
    then stops at the first tab or, when there is no tab, at the first
    space.
    """
    # --- filename \t|space stuff
    name = str[4:].rstrip('\r\n')
    for separator in ('\t', ' '):
        cut = name.find(separator)
        if cut >= 0:
            return name[:cut]
    return name
1427 1427
def reversehunks(hunks):
    '''reverse the signs in the hunks given as argument

    This function operates on hunks coming out of patch.filterpatch, that is
    a list of the form: [header1, hunk1, hunk2, header2...]. Record hunks
    are modified in place; any other item is passed through untouched.
    Example usage:

    >>> rawpatch = """diff --git a/folder1/g b/folder1/g
    ... --- a/folder1/g
    ... +++ b/folder1/g
    ... @@ -1,7 +1,7 @@
    ... +firstline
    ...  c
    ...  1
    ...  2
    ... + 3
    ... -4
    ...  5
    ...  d
    ... +lastline"""
    >>> hunks = parsepatch(rawpatch)
    >>> hunkscomingfromfilterpatch = []
    >>> for h in hunks:
    ...     hunkscomingfromfilterpatch.append(h)
    ...     hunkscomingfromfilterpatch.extend(h.hunks)

    >>> reversedhunks = reversehunks(hunkscomingfromfilterpatch)
    >>> from . import util
    >>> fp = util.stringio()
    >>> for c in reversedhunks:
    ...      c.write(fp)
    >>> fp.seek(0)
    >>> reversedpatch = fp.read()
    >>> print reversedpatch
    diff --git a/folder1/g b/folder1/g
    --- a/folder1/g
    +++ b/folder1/g
    @@ -1,4 +1,3 @@
    -firstline
     c
     1
     2
    @@ -1,6 +2,6 @@
     c
     1
     2
    - 3
    +4
     5
     d
    @@ -5,3 +6,2 @@
     5
     d
    -lastline

    '''

    from . import crecord as crecordmod
    opposite = {'-': '+', '+': '-'}
    result = []
    for item in hunks:
        if isinstance(item, crecordmod.uihunk):
            # curses hunks encapsulate the record hunk in _hunk
            item = item._hunk
        if isinstance(item, recordhunk):
            body = item.hunk
            for index, text in enumerate(body):
                sign = opposite.get(text[:1])
                if sign is not None:
                    body[index] = sign + text[1:]
            # the counters trade places along with the signs
            item.added, item.removed = item.removed, item.added
        result.append(item)
    return result
1499 1499
def parsepatch(originalchunks):
    """patch -> [] of headers -> [] of hunks

    originalchunks is a string or an iterable of strings; the pieces are
    joined and scanned with scanpatch().  Returns the list of header
    objects that were found, each one carrying its hunks in '.hunks'.

    Raises PatchError when the events produced by the scanner come in an
    order the state machine below does not allow.
    """
    class parser(object):
        """patch parsing state machine"""
        def __init__(self):
            self.fromline = 0
            self.toline = 0
            self.proc = ''
            self.header = None
            self.context = []
            self.before = []
            self.hunk = []
            self.headers = []

        def addrange(self, limits):
            # a range line gives the start lines of the next hunk
            fromstart, fromend, tostart, toend, proc = limits
            self.fromline = int(fromstart)
            self.toline = int(tostart)
            self.proc = proc

        def addcontext(self, context):
            # context closes the pending hunk, if any, and is remembered
            # as possible leading context of the next one
            if self.hunk:
                h = recordhunk(self.header, self.fromline, self.toline,
                        self.proc, self.before, self.hunk, context)
                self.header.hunks.append(h)
                self.fromline += len(self.before) + h.removed
                self.toline += len(self.before) + h.added
                self.before = []
                self.hunk = []
            self.context = context

        def addhunk(self, hunk):
            if self.context:
                self.before = self.context
                self.context = []
            self.hunk = hunk

        def newfile(self, hdr):
            # flush what belongs to the previous file first
            self.addcontext([])
            h = header(hdr)
            self.headers.append(h)
            self.header = h

        def addother(self, line):
            pass # 'other' lines are ignored

        def finished(self):
            self.addcontext([])
            return self.headers

        # current state -> {event: handler}; a missing entry is an error
        transitions = {
            'file': {'context': addcontext,
                     'file': newfile,
                     'hunk': addhunk,
                     'range': addrange},
            'context': {'file': newfile,
                        'hunk': addhunk,
                        'range': addrange,
                        'other': addother},
            'hunk': {'context': addcontext,
                     'file': newfile,
                     'range': addrange},
            'range': {'context': addcontext,
                      'hunk': addhunk},
            'other': {'other': addother},
            }

    p = parser()
    fp = stringio()
    fp.write(''.join(originalchunks))
    fp.seek(0)

    state = 'context'
    for newstate, data in scanpatch(fp):
        # only the table lookup is guarded, so that a KeyError raised
        # while a handler runs is not mistaken for a bad transition
        try:
            handler = p.transitions[state][newstate]
        except KeyError:
            raise PatchError('unhandled transition: %s -> %s' %
                                   (state, newstate))
        handler(p, data)
        state = newstate
    del fp
    return p.finished()
1582 1582
def pathtransform(path, strip, prefix):
    '''turn a path from a patch into a path suitable for the repository

    strip is the number of leading directory components to remove; runs
    of '/' count as a single separator.

    prefix, if not empty, is expected to be normalized with a / at the end.

    Returns (stripped components, path in repository).

    >>> pathtransform('a/b/c', 0, '')
    ('', 'a/b/c')
    >>> pathtransform(' a/b/c ', 0, '')
    ('', ' a/b/c')
    >>> pathtransform(' a/b/c ', 2, '')
    ('a/b/', 'c')
    >>> pathtransform('a/b/c', 0, 'd/e/')
    ('', 'd/e/a/b/c')
    >>> pathtransform(' a//b/c ', 2, 'd/e/')
    ('a//b/', 'd/e/c')
    >>> pathtransform('a/b/c', 3, '')
    Traceback (most recent call last):
    PatchError: unable to strip away 1 of 3 dirs from a/b/c
    '''
    if strip == 0:
        return '', prefix + path.rstrip()
    lastindex = len(path) - 1
    cut = 0
    remaining = strip
    while remaining > 0:
        slash = path.find('/', cut)
        if slash == -1:
            raise PatchError(_("unable to strip away %d of %d dirs from %s") %
                             (remaining, strip, path))
        cut = slash + 1
        # consume '//' in the path
        while cut < lastindex and path[cut] == '/':
            cut += 1
        remaining -= 1
    stripped = path[:cut].lstrip()
    kept = path[cut:].rstrip()
    return stripped, prefix + kept
1620 1620
def makepatchmeta(backend, afile_orig, bfile_orig, hunk, strip, prefix):
    """Build the patchmeta describing the file a hunk applies to.

    afile_orig and bfile_orig are the old and new file names found in
    the patch; both go through pathtransform() with strip and prefix.
    backend.exists() tells which candidates are present, and hunk is
    inspected to detect file creation and removal.  The op of the result
    is set to 'ADD' or 'DELETE' when such a case is detected.

    Raises PatchError when both names are /dev/null.
    """
    devnull = "/dev/null"
    nulla = afile_orig == devnull
    nullb = bfile_orig == devnull
    create = nulla and hunk.starta == 0 and hunk.lena == 0
    remove = nullb and hunk.startb == 0 and hunk.lenb == 0
    abase, afile = pathtransform(afile_orig, strip, prefix)
    gooda = not nulla and backend.exists(afile)
    bbase, bfile = pathtransform(bfile_orig, strip, prefix)
    if afile != bfile:
        goodb = not nullb and backend.exists(bfile)
    else:
        goodb = gooda
    missing = not (goodb or gooda or create)

    def dirpart(name):
        # everything up to and including the last '/'
        return name[:name.rfind('/') + 1]

    # some diff programs apparently produce patches where the afile is
    # not /dev/null, but afile starts with bfile
    abasedir = dirpart(afile)
    bbasedir = dirpart(bfile)
    if (missing and abasedir == bbasedir and afile.startswith(bfile)
        and hunk.starta == 0 and hunk.lena == 0):
        create = True
        missing = False

    # If afile is "a/b/foo" and bfile is "a/b/foo.orig" we assume the
    # diff is between a file and its backup. In this case, the original
    # file should be patched (see original mpatch code).
    isbackup = (abase == bbase and bfile.startswith(afile))
    preferred = afile if isbackup else bfile

    fname = None
    if not missing and gooda:
        fname = preferred if goodb else afile

    if not fname:
        if not nullb:
            fname = preferred
        elif not nulla:
            fname = afile
        else:
            raise PatchError(_("undefined source and destination files"))

    gp = patchmeta(fname)
    if create:
        gp.op = 'ADD'
    elif remove:
        gp.op = 'DELETE'
    return gp
1675 1675
def scanpatch(fp):
    """like patch.iterhunks, but yield different events

    - ('file',    [header_lines + fromfile + tofile])
    - ('context', [context_lines])
    - ('hunk',    [hunk_lines])
    - ('range',   (-start,len, +start,len, proc))

    A line that fits none of the above is yielded as ('other', line).
    """
    rangepattern = re.compile(r'@@ -(\d+),(\d+) \+(\d+),(\d+) @@\s*(.*)')
    lr = linereader(fp)

    def scanwhile(first, p):
        """scan lr while predicate holds"""
        collected = [first]
        while True:
            following = lr.readline()
            if following == '':
                break
            if not p(following):
                # not ours: hand the line back to the reader
                lr.push(following)
                break
            collected.append(following)
        return collected

    def notheader(line):
        fields = line.split(None, 1)
        return not fields or fields[0] not in ('---', 'diff')

    def iscontext(line):
        return line[0] in ' \\'

    def ischange(line):
        return line[0] in '-+\\'

    while True:
        line = lr.readline()
        if line == '':
            break
        if line.startswith(('diff --git a/', 'diff -r ')):
            header = scanwhile(line, notheader)
            fromfile = lr.readline()
            if fromfile.startswith('---'):
                header += [fromfile, lr.readline()]
            else:
                lr.push(fromfile)
            yield 'file', header
        elif line[0] == ' ':
            yield 'context', scanwhile(line, iscontext)
        elif line[0] in '-+':
            yield 'hunk', scanwhile(line, ischange)
        else:
            found = rangepattern.match(line)
            if found:
                yield 'range', found.groups()
            else:
                yield 'other', line
1721 1721
def scangitpatch(lr, firstline):
    """
    Git patches can emit:
    - rename a to b
    - change b
    - copy a to c
    - change c

    We cannot apply this sequence as-is, the renamed 'a' could not be
    found for it would have been renamed already. And we cannot copy
    from 'b' instead because 'b' would have been changed already. So
    we scan the git patch for copy and rename commands so we can
    perform the copies ahead of time.

    lr is the line reader in use and firstline the line it has already
    consumed.  Returns what readgitpatch() finds; the underlying file is
    then sought back to where the scan started.
    """
    source = lr.fp
    try:
        start = source.tell()
    except IOError:
        # the position cannot be queried: continue from an in-memory
        # copy of the remaining input, starting at 0
        start = 0
        source = stringio(source.read())
    scanner = linereader(source)
    scanner.push(firstline)
    found = readgitpatch(scanner)
    source.seek(start)
    return found
1747 1747
def iterhunks(fp):
    """Read a patch and yield the following events:
    - ("file", (afile, bfile, firsthunk, gp)): select a new target file.
      firsthunk is the first hunk read for that file, or None for a git
      entry that comes without any hunk; gp is a copy of the matching
      git metadata record, or None.
    - ("hunk", hunk): a new hunk is ready to be applied, follows a
    "file" event.
    - ("git", gitchanges): current diff is in git format, gitchanges
    lists copies of the gitpatch records whose op is COPY or RENAME.
    Unique event.

    Raises PatchError when a 'diff --git' line cannot be matched with the
    git metadata scanned from the input.
    """
    afile = ""
    bfile = ""
    state = None
    hunknum = 0
    # newfile: file names were just read; emitfile: the "file" event for
    # them is still owed and goes out with the first hunk
    emitfile = newfile = False
    # None until the first 'diff --git' line triggers the metadata scan
    gitpatches = None

    # our states
    BFILE = 1
    # None: format unknown, False: unified diff, True: context diff
    context = None
    lr = linereader(fp)

    for x in iter(lr.readline, ''):
        # a hunk can only start once file names are known
        if state == BFILE and (
            (not context and x[0] == '@')
            or (context is not False and x.startswith('***************'))
            or x.startswith('GIT binary patch')):
            gp = None
            if (gitpatches and
                gitpatches[-1].ispatching(afile, bfile)):
                gp = gitpatches.pop()
            if x.startswith('GIT binary patch'):
                # NOTE(review): gp is None here when no git metadata
                # matched, in which case gp.path fails - confirm whether
                # that can happen with real input
                h = binhunk(lr, gp.path)
            else:
                if context is None and x.startswith('***************'):
                    context = True
                h = hunk(x, hunknum + 1, lr, context)
            hunknum += 1
            if emitfile:
                emitfile = False
                yield 'file', (afile, bfile, h, gp and gp.copy() or None)
            yield 'hunk', h
        elif x.startswith('diff --git a/'):
            m = gitre.match(x.rstrip(' \r\n'))
            if not m:
                continue
            if gitpatches is None:
                # scan whole input for git metadata
                gitpatches = scangitpatch(lr, x)
                yield 'git', [g.copy() for g in gitpatches
                              if g.op in ('COPY', 'RENAME')]
                # reversed so that pop() hands out entries in input order
                gitpatches.reverse()
            afile = 'a/' + m.group(1)
            bfile = 'b/' + m.group(2)
            # entries skipped on the way to this file had no hunk: emit
            # them as files without a first hunk
            while gitpatches and not gitpatches[-1].ispatching(afile, bfile):
                gp = gitpatches.pop()
                yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())
            if not gitpatches:
                raise PatchError(_('failed to synchronize metadata for "%s"')
                                 % afile[2:])
            gp = gitpatches[-1]
            newfile = True
        elif x.startswith('---'):
            # check for a unified diff
            l2 = lr.readline()
            if not l2.startswith('+++'):
                lr.push(l2)
                continue
            newfile = True
            context = False
            afile = parsefilename(x)
            bfile = parsefilename(l2)
        elif x.startswith('***'):
            # check for a context diff
            l2 = lr.readline()
            if not l2.startswith('---'):
                lr.push(l2)
                continue
            # peek at the third line: it is always pushed back
            l3 = lr.readline()
            lr.push(l3)
            if not l3.startswith("***************"):
                lr.push(l2)
                continue
            newfile = True
            context = True
            afile = parsefilename(x)
            bfile = parsefilename(l2)

        if newfile:
            newfile = False
            emitfile = True
            state = BFILE
            hunknum = 0

    # git entries left over at the end of the input had no hunk either
    while gitpatches:
        gp = gitpatches.pop()
        yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())
1843 1843
def applybindelta(binchunk, data):
    """Apply a binary delta hunk
    The algorithm used is the algorithm from git's patch-delta.c

    binchunk is the decoded delta and data the content it applies to.
    The delta starts with two variable length headers, which are skipped,
    followed by a sequence of commands: a command byte with the high bit
    set copies a range of data, any other non-zero command byte inserts
    that many bytes taken from the delta itself.

    Returns the resulting content.  Raises PatchError on a zero command
    byte.
    """
    def deltahead(binchunk):
        # length of a header: it ends with the first byte whose high bit
        # is clear
        i = 0
        for c in binchunk:
            i += 1
            if not (ord(c) & 0x80):
                return i
        return i
    # the pieces are collected and joined once at the end rather than
    # growing a string inside the loop
    pieces = []
    s = deltahead(binchunk)
    binchunk = binchunk[s:]
    s = deltahead(binchunk)
    binchunk = binchunk[s:]
    i = 0
    while i < len(binchunk):
        cmd = ord(binchunk[i])
        i += 1
        if (cmd & 0x80):
            # copy command: the low bits tell which offset and size bytes
            # follow, least significant byte first
            offset = 0
            size = 0
            if (cmd & 0x01):
                offset = ord(binchunk[i])
                i += 1
            if (cmd & 0x02):
                offset |= ord(binchunk[i]) << 8
                i += 1
            if (cmd & 0x04):
                offset |= ord(binchunk[i]) << 16
                i += 1
            if (cmd & 0x08):
                offset |= ord(binchunk[i]) << 24
                i += 1
            if (cmd & 0x10):
                size = ord(binchunk[i])
                i += 1
            if (cmd & 0x20):
                size |= ord(binchunk[i]) << 8
                i += 1
            if (cmd & 0x40):
                size |= ord(binchunk[i]) << 16
                i += 1
            if size == 0:
                size = 0x10000
            offset_end = offset + size
            pieces.append(data[offset:offset_end])
        elif cmd != 0:
            # insert command: cmd is the number of literal bytes
            offset_end = i + cmd
            pieces.append(binchunk[i:offset_end])
            i += cmd
        else:
            raise PatchError(_('unexpected delta opcode 0'))
    return "".join(pieces)
1899 1899
def applydiff(ui, fp, backend, store, strip=1, prefix='', eolmode='strict'):
    """Reads a patch from fp and tries to apply it.

    Returns 0 for a clean patch, -1 if any rejects were found and 1 if
    there was any fuzz.

    If 'eolmode' is 'strict', the patch content and patched file are
    read in binary mode. Otherwise, line endings are ignored when
    patching then normalized according to 'eolmode'.

    All the work is done by _applydiff(), which is called with patchfile
    as the patcher and with every argument passed through unchanged.
    """
    return _applydiff(ui, fp, patchfile, backend, store, strip=strip,
                      prefix=prefix, eolmode=eolmode)
1912 1912
def _applydiff(ui, fp, patcher, backend, store, strip=1, prefix='',
               eolmode='strict'):
    """Drive iterhunks(fp) and apply every event to backend.

    'patcher' is called as patcher(ui, gp, backend, store, eolmode=...)
    for each file that has hunks; the object it returns receives the
    hunks through apply() and is finished with close().

    Returns -1 if anything was rejected, otherwise 1 if some hunk
    applied with a positive apply() result, otherwise 0.
    """
    if prefix:
        prefix = pathutil.canonpath(backend.repo.root, backend.repo.getcwd(),
                                    prefix)
        if prefix != '':
            prefix += '/'

    def pstrip(p):
        return pathtransform(p, strip - 1, prefix)[1]

    rejects = 0
    err = 0
    current_file = None

    for state, values in iterhunks(fp):
        if state == 'hunk':
            # hunks of a file that could not be opened are dropped
            if not current_file:
                continue
            if current_file.apply(values) > 0:
                err = 1
        elif state == 'file':
            # a new file starts: finish the previous one first
            if current_file:
                rejects += current_file.close()
                current_file = None
            afile, bfile, first_hunk, gp = values
            if gp:
                gp.path = pstrip(gp.path)
                if gp.oldpath:
                    gp.oldpath = pstrip(gp.oldpath)
            else:
                gp = makepatchmeta(backend, afile, bfile, first_hunk, strip,
                                   prefix)
            if gp.op == 'RENAME':
                backend.unlink(gp.oldpath)
            if not first_hunk:
                # metadata-only change, there is no content to patch
                if gp.op == 'DELETE':
                    backend.unlink(gp.path)
                    continue
                data, mode = None, None
                if gp.op in ('RENAME', 'COPY'):
                    data, mode = store.getfile(gp.oldpath)[:2]
                    if data is None:
                        # This means that the old path does not exist
                        raise PatchError(_("source file '%s' does not exist")
                                         % gp.oldpath)
                if gp.mode:
                    mode = gp.mode
                    if gp.op == 'ADD':
                        # Added files without content have no hunk and
                        # must be created
                        data = ''
                if data or mode:
                    creating = gp.op in ('ADD', 'RENAME', 'COPY')
                    if creating and backend.exists(gp.path):
                        raise PatchError(_("cannot create %s: destination "
                                           "already exists") % gp.path)
                    backend.setfile(gp.path, data, mode, gp.oldpath)
                continue
            try:
                current_file = patcher(ui, gp, backend, store,
                                       eolmode=eolmode)
            except PatchError as inst:
                # report the failure and count the whole file as rejected
                ui.warn(str(inst) + '\n')
                current_file = None
                rejects += 1
        elif state == 'git':
            for gp in values:
                path = pstrip(gp.oldpath)
                data, mode = backend.getfile(path)
                # A missing source (data is None) is ignored here: it will
                # trigger a getfile() error in a place more appropriate
                # for error handling, and will not interrupt the patching
                # process.
                if data is not None:
                    store.setfile(path, data, mode)
        else:
            raise error.Abort(_('unsupported parser state: %s') % state)

    if current_file:
        rejects += current_file.close()

    return -1 if rejects else err
2002 2002
def _externalpatch(ui, repo, patcher, patchname, strip, files,
                   similarity):
    """use <patcher> to apply <patchname> to the working directory.
    returns whether patch was applied with fuzz factor.

    Every file named in a 'patching file ' output line is added to
    'files'. Raises PatchError when the command exits with a non-zero
    status."""

    fuzz = False
    # Name of the file currently reported by the patcher and whether it has
    # already been echoed to the user. Both are initialised up front so that
    # a 'with fuzz' / 'FAILED' line showing up before any 'patching file'
    # line cannot hit an unbound local.
    pf = None
    printed_file = False
    args = []
    cwd = repo.root
    if cwd:
        args.append('-d %s' % util.shellquote(cwd))
    fp = util.popen('%s %s -p%d < %s' % (patcher, ' '.join(args), strip,
                                       util.shellquote(patchname)))
    try:
        for line in util.iterfile(fp):
            line = line.rstrip()
            ui.note(line + '\n')
            if line.startswith('patching file '):
                pf = util.parsepatchoutput(line)
                printed_file = False
                files.add(pf)
            elif 'with fuzz' in line:
                fuzz = True
                if pf is not None and not printed_file:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
            elif 'saving rejects to file' in line:
                ui.warn(line + '\n')
            elif 'FAILED' in line:
                if pf is not None and not printed_file:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
    finally:
        # record whatever was touched, even if reading the output failed
        if files:
            scmutil.marktouched(repo, files, similarity)
    code = fp.close()
    if code:
        raise PatchError(_("patch command failed: %s") %
                         util.explainexit(code)[0])
    return fuzz
2044 2044
def patchbackend(ui, backend, patchobj, strip, prefix, files=None,
                 eolmode='strict'):
    """Apply patchobj through backend and report whether there was fuzz.

    'patchobj' is first handed to open(); when that raises TypeError it
    is used directly as the patch stream. The names returned by
    backend.close() are added to 'files'. An 'eolmode' of None is looked
    up in the patch.eol configuration, defaulting to 'strict'.

    Raises error.Abort for an unknown eolmode and PatchError when
    applydiff() reports rejects.
    """
    if files is None:
        files = set()
    if eolmode is None:
        eolmode = ui.config('patch', 'eol', 'strict')
    lowered = eolmode.lower()
    if lowered not in eolmodes:
        raise error.Abort(_('unsupported line endings type: %s') % eolmode)
    eolmode = lowered

    store = filestore()
    try:
        fp = open(patchobj, 'rb')
    except TypeError:
        fp = patchobj
    try:
        ret = applydiff(ui, fp, backend, store, strip=strip, prefix=prefix,
                        eolmode=eolmode)
    finally:
        # only close the stream if it was opened here
        if fp != patchobj:
            fp.close()
        files.update(backend.close())
        store.close()
    if ret < 0:
        raise PatchError(_('patch failed to apply'))
    return ret > 0
2071 2071
def internalpatch(ui, repo, patchobj, strip, prefix='', files=None,
                  eolmode='strict', similarity=0):
    """use builtin patch to apply <patchobj> to the working directory.
    returns whether patch was applied with fuzz factor.

    The work is done by patchbackend() on a workingbackend built from
    'repo' and 'similarity'."""
    return patchbackend(ui, workingbackend(ui, repo, similarity), patchobj,
                        strip, prefix, files, eolmode)
2078 2078
def patchrepo(ui, repo, ctx, store, patchobj, strip, prefix, files=None,
              eolmode='strict'):
    """apply <patchobj> through a repobackend built from repo, ctx and store.
    returns the result of patchbackend()."""
    return patchbackend(ui, repobackend(ui, repo, ctx, store), patchobj,
                        strip, prefix, files, eolmode)
2083 2083
def patch(ui, repo, patchname, strip=1, prefix='', files=None, eolmode='strict',
          similarity=0):
    """Apply <patchname> to the working directory.

    The program configured as ui.patch is used when set, otherwise the
    builtin patcher is used.

    'eolmode' specifies how end of lines should be handled. It can be:
    - 'strict': inputs are read in binary mode, EOLs are preserved
    - 'crlf': EOLs are ignored when patching and reset to CRLF
    - 'lf': EOLs are ignored when patching and reset to LF
    - None: get it from user settings, default to 'strict'
    'eolmode' is ignored when using an external patcher program.

    Returns whether patch was applied with fuzz factor.
    """
    if files is None:
        files = set()
    patcher = ui.config('ui', 'patch')
    if not patcher:
        return internalpatch(ui, repo, patchname, strip, prefix, files,
                             eolmode, similarity)
    return _externalpatch(ui, repo, patcher, patchname, strip,
                          files, similarity)
2105 2105
def changedfiles(ui, repo, patchpath, strip=1):
    """Return the set of paths touched by the patch file at patchpath.

    For every 'file' event of iterhunks() the target path is recorded,
    plus the source path when the operation is a rename. Raises
    error.Abort on a parser state other than 'file', 'hunk' or 'git'.
    """
    backend = fsbackend(ui, repo.root)

    def stripped(path):
        return pathtransform(path, strip - 1, '')[1]

    with open(patchpath, 'rb') as fp:
        changed = set()
        for state, values in iterhunks(fp):
            if state != 'file':
                if state not in ('hunk', 'git'):
                    raise error.Abort(_('unsupported parser state: %s')
                                      % state)
                continue
            afile, bfile, first_hunk, gp = values
            if gp:
                gp.path = stripped(gp.path)
                if gp.oldpath:
                    gp.oldpath = stripped(gp.oldpath)
            else:
                gp = makepatchmeta(backend, afile, bfile, first_hunk, strip,
                                   '')
            changed.add(gp.path)
            if gp.op == 'RENAME':
                changed.add(gp.oldpath)
        return changed
2126 2126
class GitDiffRequired(Exception):
    """Raised by diff()'s losedata callback to request a git-format retry."""
2129 2129
def diffallopts(ui, opts=None, untrusted=False, section='diff'):
    '''return diffopts with all features supported and parsed

    This is difffeatureopts() with the git, whitespace and formatchanging
    feature groups all switched on.'''
    allfeatures = {'git': True, 'whitespace': True, 'formatchanging': True}
    return difffeatureopts(ui, opts=opts, untrusted=untrusted,
                           section=section, **allfeatures)

# alias of diffallopts
diffopts = diffallopts
2136 2136
def difffeatureopts(ui, opts=None, untrusted=False, section='diff', git=False,
                    whitespace=False, formatchanging=False):
    '''return diffopts with only opted-in features parsed

    Values come from 'opts' (command line) when they look set, otherwise
    from the 'section' part of the configuration.

    Features:
    - git: git-style diffs
    - whitespace: whitespace options like ignoreblanklines and ignorews
    - formatchanging: options that will likely break or cause correctness issues
      with most diff parsers
    '''
    def get(key, name=None, getter=ui.configbool, forceplain=None):
        if opts:
            v = opts.get(key)
            # diffopts flags are either None-default (which is passed
            # through unchanged, so we can identify unset values), or
            # some other falsey default (eg --unified, which defaults
            # to an empty string). We only want to override the config
            # entries from hgrc with command line values if they
            # appear to have been set, which is any truthy value,
            # True, or False.
            if v or isinstance(v, bool):
                return v
        if forceplain is not None and ui.plain():
            return forceplain
        return getter(section, name or key, None, untrusted=untrusted)

    # core options, expected to be understood by every diff parser
    buildopts = {
        'nodates': get('nodates'),
        'showfunc': get('show_function', 'showfunc'),
        'context': get('unified', getter=ui.config),
    }

    if git:
        buildopts['git'] = get('git')

        # since this is in the experimental section, we need to call
        # ui.configbool directly
        buildopts['showsimilarity'] = ui.configbool(
            'experimental', 'extendedheader.similarity')

        # need to inspect the ui object instead of using get() since we want to
        # test for an int
        hconf = ui.config('experimental', 'extendedheader.index')
        if hconf is not None:
            hlen = None
            try:
                # the hash config could be an integer (for length of hash) or a
                # word (e.g. short, full, none)
                hlen = int(hconf)
                # The range check belongs here, where hlen is known to be an
                # integer. For word values hlen may still be None, which
                # cannot be formatted with '%d'.
                if hlen < 0 or hlen > 40:
                    msg = _("invalid length for extendedheader.index: '%d'\n")
                    ui.warn(msg % hlen)
            except ValueError:
                # default value
                if hconf == 'short' or hconf == '':
                    hlen = 12
                elif hconf == 'full':
                    hlen = 40
                elif hconf != 'none':
                    msg = _("invalid value for extendedheader.index: '%s'\n")
                    ui.warn(msg % hconf)
            finally:
                # hlen stays None for 'none' and for unrecognised words
                buildopts['index'] = hlen

    if whitespace:
        buildopts['ignorews'] = get('ignore_all_space', 'ignorews')
        buildopts['ignorewsamount'] = get('ignore_space_change',
                                          'ignorewsamount')
        buildopts['ignoreblanklines'] = get('ignore_blank_lines',
                                            'ignoreblanklines')
    if formatchanging:
        buildopts['text'] = opts and opts.get('text')
        buildopts['nobinary'] = get('nobinary', forceplain=False)
        buildopts['noprefix'] = get('noprefix', forceplain=False)

    return mdiff.diffopts(**buildopts)
2214 2214
def diff(repo, node1=None, node2=None, match=None, changes=None, opts=None,
         losedatafn=None, prefix='', relroot='', copy=None):
    '''return the diff of changes to files between two nodes, or node and
    working directory, as an iterable of text blocks.

    if node1 is None, use first dirstate parent instead.
    if node2 is None, compare node1 with working directory.

    losedatafn(**kwarg) is a callable run when opts.upgrade=True and
    every time some change cannot be represented with the current
    patch format. Return False to upgrade to git patch format, True to
    accept the loss or raise an exception to abort the diff. It is
    called with the name of current file being diffed as 'fn'. If set
    to None, patches will always be upgraded to git format when
    necessary.

    prefix is a filename prefix that is prepended to all filenames on
    display (used for subrepos).

    relroot, if not empty, must be normalized with a trailing /. Any match
    patterns that fall outside it will be ignored.

    copy, if not empty, should contain mappings {dst@y: src@x} of copy
    information.'''

    if opts is None:
        opts = mdiff.defaultopts

    if not node1 and not node2:
        node1 = repo.dirstate.p1()

    def lrugetfilectx():
        # filelogs are remembered per file name; 'order' records how
        # recently each name was used so the oldest entry can be dropped
        cache = {}
        order = collections.deque()
        def getfilectx(f, ctx):
            fctx = ctx.filectx(f, filelog=cache.get(f))
            if f in cache:
                order.remove(f)
            else:
                if len(cache) > 20:
                    del cache[order.popleft()]
                cache[f] = fctx.filelog()
            order.append(f)
            return fctx
        return getfilectx
    getfilectx = lrugetfilectx()

    ctx1 = repo[node1]
    ctx2 = repo[node2]

    relfiltered = False
    if relroot != '' and match.always():
        # as a special case, create a new matcher with just the relroot
        match = scmutil.match(ctx2, [relroot], default='path')
        relfiltered = True

    if not changes:
        changes = repo.status(ctx1, ctx2, match=match)
    modified, added, removed = changes[:3]

    if not (modified or added or removed):
        return []

    hexfunc = hex if repo.ui.debugflag else short
    revs = [hexfunc(node) for node in [ctx1.node(), ctx2.node()] if node]

    if copy is None:
        copy = {}
        if opts.git or opts.upgrade:
            copy = copies.pathcopies(ctx1, ctx2, match=match)

    if relroot is not None:
        if not relfiltered:
            # XXX this would ideally be done in the matcher, but that is
            # generally meant to 'or' patterns, not 'and' them. In this case we
            # need to 'and' all the patterns from the matcher with relroot.
            modified = [f for f in modified if f.startswith(relroot)]
            added = [f for f in added if f.startswith(relroot)]
            removed = [f for f in removed if f.startswith(relroot)]
            relfiltered = True
        # filter out copies where either side isn't inside the relative root
        copy = dict(((dst, src) for (dst, src) in copy.iteritems()
                     if dst.startswith(relroot)
                     and src.startswith(relroot)))

    modifiedset = set(modified)
    addedset = set(added)
    removedset = set(removed)
    for f in modified:
        if f not in ctx1:
            # Fix up added, since merged-in additions appear as
            # modifications during merges
            modifiedset.remove(f)
            addedset.add(f)
    for f in removed:
        if f not in ctx1:
            # Merged-in additions that are then removed are reported as
            # removed. They are not in ctx1, so we don't want to show them
            # in the diff.
            removedset.remove(f)
    modified = sorted(modifiedset)
    added = sorted(addedset)
    removed = sorted(removedset)
    for dst, src in copy.items():
        if src not in ctx1:
            # Files merged in during a merge and then copied/renamed are
            # reported as copies. We want to show them in the diff as additions.
            del copy[dst]

    def difffn(opts, losedata):
        return trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
                       copy, getfilectx, opts, losedata, prefix, relroot)

    if not opts.upgrade or opts.git:
        return difffn(opts, None)

    def losedata(fn):
        if not losedatafn or not losedatafn(fn=fn):
            raise GitDiffRequired

    try:
        # Buffer the whole output until we are sure it can be generated
        return list(difffn(opts.copy(git=False), losedata))
    except GitDiffRequired:
        return difffn(opts.copy(git=True), None)
2343 2343
def difflabel(func, *args, **kw):
    '''yields 2-tuples of (output, label) based on the output of func()

    func(*args, **kw) must produce chunks of diff text. Each chunk is
    split into lines; header lines and hunk lines get their own labels,
    and on changed lines tabs and trailing whitespace are labelled
    separately.'''
    headprefixes = [('diff', 'diff.diffline'),
                    ('copy', 'diff.extended'),
                    ('rename', 'diff.extended'),
                    ('old', 'diff.extended'),
                    ('new', 'diff.extended'),
                    ('deleted', 'diff.extended'),
                    ('index', 'diff.extended'),
                    ('similarity', 'diff.extended'),
                    ('---', 'diff.file_a'),
                    ('+++', 'diff.file_b')]
    textprefixes = [('@', 'diff.hunk'),
                    ('-', 'diff.deleted'),
                    ('+', 'diff.inserted')]
    # True while we are inside a file header (until the next '@' line)
    head = False
    for chunk in func(*args, **kw):
        for lineno, line in enumerate(chunk.split('\n')):
            if lineno != 0:
                yield ('\n', '')
            if head:
                head = not line.startswith('@')
            elif line and line[0] not in ' +-@\\':
                head = True

            # highlight tabs and trailing whitespace, but only in
            # changed lines
            diffline = bool(not head and line and line[0] in '+-')
            stripline = line.rstrip() if diffline else line

            prefixes = headprefixes if head else textprefixes
            for prefix, label in prefixes:
                if not stripline.startswith(prefix):
                    continue
                if diffline:
                    for token in tabsplitter.findall(stripline):
                        if '\t' == token[0]:
                            yield (token, 'diff.tab')
                        else:
                            yield (token, label)
                else:
                    yield (stripline, label)
                break
            else:
                yield (line, '')
            if line != stripline:
                yield (line[len(stripline):], 'diff.trailingwhitespace')
2397 2397
def diffui(*args, **kw):
    '''like diff(), but yields 2-tuples of (output, label) for ui.write()

    All arguments are forwarded to diff() through difflabel().'''
    labelled = difflabel(diff, *args, **kw)
    return labelled
2401 2401
def _filepairs(modified, added, removed, copy, opts):
    '''generates tuples (f1, f2, copyop), where f1 is the name of the file
    before and f2 is the name after. For added files, f1 will be None,
    and for removed files, f2 will be None. copyop may be set to None, 'copy'
    or 'rename' (the latter two only if opts.git is set).

    A removed file that is reported as the source of a rename is not
    yielded a second time when opts.git is set.'''
    # sources already consumed by a 'rename'
    gone = set()

    # reverse mapping: copy source -> copy destination
    copyto = {}
    for dst, src in copy.items():
        copyto[src] = dst

    addedset = set(added)
    removedset = set(removed)

    for f in sorted(modified + added + removed):
        if f in addedset:
            f1, f2, copyop = None, f, None
            if f in copy and opts.git:
                f1 = copy[f]
                if f1 in removedset and f1 not in gone:
                    copyop = 'rename'
                    gone.add(f1)
                else:
                    copyop = 'copy'
        elif f in removedset:
            f1, f2, copyop = f, None, None
            # have we already reported a copy above?
            if (opts.git and f in copyto and copyto[f] in addedset
                and copy[copyto[f]] == f):
                continue
        else:
            f1, f2, copyop = f, f, None
        yield f1, f2, copyop
2434 2434
def trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
            copy, getfilectx, opts, losedatafn, prefix, relroot):
    '''given input data, generate a diff and yield it in blocks

    If generating a diff would lose data like flags or binary data and
    losedatafn is not None, it will be called.

    relroot is removed and prefix is added to every path in the diff output.

    If relroot is not empty, this function expects every path in modified,
    added, removed and copy to start with it.'''

    def gitindex(text):
        # sha1 of a 'blob <length>\0' header followed by the content
        if not text:
            text = ""
        l = len(text)
        s = hashlib.sha1('blob %d\0' % l)
        s.update(text)
        return s.hexdigest()

    if opts.noprefix:
        aprefix = bprefix = ''
    else:
        aprefix = 'a/'
        bprefix = 'b/'

    def diffline(f, revs):
        revinfo = ' '.join(["-r %s" % rev for rev in revs])
        return 'diff %s %s' % (revinfo, f)

    date1 = util.datestr(ctx1.date())
    date2 = util.datestr(ctx2.date())

    # file flag -> mode string used in git-style headers
    gitmode = {'l': '120000', 'x': '100755', '': '100644'}

    if relroot != '' and (repo.ui.configbool('devel', 'all')
                          or repo.ui.configbool('devel', 'check-relroot')):
        for f in modified + added + removed + copy.keys() + copy.values():
            if f is not None and not f.startswith(relroot):
                raise AssertionError(
                    "file %s doesn't start with relroot %s" % (f, relroot))

    for f1, f2, copyop in _filepairs(modified, added, removed, copy, opts):
        content1 = None
        content2 = None
        flag1 = None
        flag2 = None
        if f1:
            content1 = getfilectx(f1, ctx1).data()
            if opts.git or losedatafn:
                flag1 = ctx1.flags(f1)
        if f2:
            content2 = getfilectx(f2, ctx2).data()
            if opts.git or losedatafn:
                flag2 = ctx2.flags(f2)
        binary = False
        if opts.git or losedatafn:
            binary = util.binary(content1) or util.binary(content2)

        if losedatafn and not opts.git:
            if (binary or
                # copy/rename
                f2 in copy or
                # empty file creation
                (not f1 and not content2) or
                # empty file deletion
                (not content1 and not f2) or
                # create with flags
                (not f1 and flag2) or
                # change flags
                (f1 and f2 and flag1 != flag2)):
                losedatafn(f2 or f1)

        # display paths: relroot stripped, prefix prepended
        path1 = f1 or f2
        path2 = f2 or f1
        path1 = posixpath.join(prefix, path1[len(relroot):])
        path2 = posixpath.join(prefix, path2[len(relroot):])
        header = []
        if opts.git:
            header.append('diff --git %s%s %s%s' %
                          (aprefix, path1, bprefix, path2))
            if not f1: # added
                header.append('new file mode %s' % gitmode[flag2])
            elif not f2: # removed
                header.append('deleted file mode %s' % gitmode[flag1])
            else:  # modified/copied/renamed
                mode1, mode2 = gitmode[flag1], gitmode[flag2]
                if mode1 != mode2:
                    header.append('old mode %s' % mode1)
                    header.append('new mode %s' % mode2)
                if copyop is not None:
                    if opts.showsimilarity:
                        # Look the files up by their repository paths
                        # (f1/f2, both set in this branch). path1/path2 are
                        # display paths and differ from them whenever
                        # prefix or relroot is non-empty.
                        sim = similar.score(ctx1[f1], ctx2[f2]) * 100
                        header.append('similarity index %d%%' % sim)
                    header.append('%s from %s' % (copyop, path1))
                    header.append('%s to %s' % (copyop, path2))
        elif revs and not repo.ui.quiet:
            header.append(diffline(path1, revs))

        if binary and opts.git and not opts.nobinary:
            text = mdiff.b85diff(content1, content2)
            if text:
                header.append('index %s..%s' %
                              (gitindex(content1), gitindex(content2)))
        else:
            if opts.git and opts.index > 0:
                flag = flag1
                if flag is None:
                    flag = flag2
                header.append('index %s..%s %s' %
                              (gitindex(content1)[0:opts.index],
                               gitindex(content2)[0:opts.index],
                               gitmode[flag]))

            text = mdiff.unidiff(content1, date1,
                                 content2, date2,
                                 path1, path2, opts=opts)
        # a lone 'diff' line is only emitted together with some text
        if header and (text or len(header) > 1):
            yield '\n'.join(header) + '\n'
        if text:
            yield text
2556 2556
def diffstatsum(stats):
    """Summarise (filename, adds, removes, isbinary) tuples.

    Returns (widest filename as measured by encoding.colwidth, largest
    adds + removes of a single file, total adds, total removes, whether
    any entry was flagged binary).
    """
    maxfile = maxtotal = addtotal = removetotal = 0
    binary = False
    for name, nadds, nremoves, isbin in stats:
        maxfile = max(maxfile, encoding.colwidth(name))
        maxtotal = max(maxtotal, nadds + nremoves)
        addtotal += nadds
        removetotal += nremoves
        binary = binary or isbin

    return maxfile, maxtotal, addtotal, removetotal, binary
2567 2567
def diffstatdata(lines):
    """Collect per-file statistics from the lines of a diff.

    Returns a list of (filename, adds, removes, isbinary) tuples, one per
    'diff' header line for which a file name was found, in order of
    appearance. '+++ ' and '--- ' header lines are not counted as
    additions or removals.
    """
    # raw string: '\s' must reach the regex engine, not the string parser
    diffre = re.compile(r'^diff .*-r [a-z0-9]+\s(.*)$')

    results = []
    filename, adds, removes, isbinary = None, 0, 0, False

    def addresult():
        # flush the counters of the file seen so far, if any
        if filename:
            results.append((filename, adds, removes, isbinary))

    for line in lines:
        if line.startswith('diff'):
            addresult()
            # set numbers to 0 anyway when starting new file
            adds, removes, isbinary = 0, 0, False
            if line.startswith('diff --git a/'):
                filename = gitre.search(line).group(2)
            elif line.startswith('diff -r'):
                # format: "diff -r ... -r ... filename"
                filename = diffre.search(line).group(1)
        elif line.startswith('+') and not line.startswith('+++ '):
            adds += 1
        elif line.startswith('-') and not line.startswith('--- '):
            removes += 1
        elif line.startswith(('GIT binary patch', 'Binary file')):
            isbinary = True
    addresult()
    return results
2597 2597
def diffstat(lines, width=80):
    """Render a diffstat summary for the diff in lines as one string.

    One row is produced per file found by diffstatdata(), followed by a
    totals line when there is at least one file. The +/- graph is scaled
    to fit 'width' and is never narrower than 10 columns.
    """
    stats = diffstatdata(lines)
    maxname, maxtotal, totaladds, totalremoves, hasbinary = diffstatsum(stats)

    countwidth = len(str(maxtotal))
    if hasbinary and countwidth < 3:
        # leave room for 'Bin'
        countwidth = 3
    graphwidth = max(width - countwidth - maxname - 6, 10)

    def scale(i):
        if maxtotal <= graphwidth:
            return i
        # If diffstat runs out of room it doesn't print anything,
        # which isn't very useful, so always print at least one + or -
        # if there were at least some changes.
        return max(i * graphwidth // maxtotal, int(bool(i)))

    output = []
    for filename, adds, removes, isbinary in stats:
        count = 'Bin' if isbinary else adds + removes
        padding = ' ' * (maxname - encoding.colwidth(filename))
        # NOTE(review): the literal below is copied as it appears in this
        # view; confirm its spacing against the canonical file.
        output.append(' %s%s | %*s %s%s\n' %
                      (filename, padding, countwidth, count,
                       '+' * scale(adds), '-' * scale(removes)))

    if stats:
        output.append(_(' %d files changed, %d insertions(+), '
                        '%d deletions(-)\n')
                      % (len(stats), totaladds, totalremoves))

    return ''.join(output)
2635 2635
def diffstatui(*args, **kw):
    '''like diffstat(), but yields 2-tuples of (output, label) for
    ui.write()

    Lines ending in '+' or '-' are split into the text before the graph
    and the runs of '+' and '-' characters, which get their own labels.
    '''

    for line in diffstat(*args, **kw).splitlines():
        if not line or line[-1] not in '+-':
            yield (line, '')
        else:
            name, graph = line.rsplit(' ', 1)
            yield (name + ' ', '')
            inserted = re.search(r'\++', graph)
            if inserted:
                yield (inserted.group(0), 'diffstat.inserted')
            deleted = re.search(r'-+', graph)
            if deleted:
                yield (deleted.group(0), 'diffstat.deleted')
        yield ('\n', '')
@@ -1,366 +1,388 b''
1 1 $ hg init repo
2 2 $ cd repo
3 3 $ cat > a <<EOF
4 4 > c
5 5 > c
6 6 > a
7 7 > a
8 8 > b
9 9 > a
10 10 > a
11 11 > c
12 12 > c
13 13 > EOF
14 14 $ hg ci -Am adda
15 15 adding a
16 16
17 17 $ cat > a <<EOF
18 18 > c
19 19 > c
20 20 > a
21 21 > a
22 22 > dd
23 23 > a
24 24 > a
25 25 > c
26 26 > c
27 27 > EOF
28 28
29 29 default context
30 30
31 31 $ hg diff --nodates
32 32 diff -r cf9f4ba66af2 a
33 33 --- a/a
34 34 +++ b/a
35 35 @@ -2,7 +2,7 @@
36 36 c
37 37 a
38 38 a
39 39 -b
40 40 +dd
41 41 a
42 42 a
43 43 c
44 44
45 45 invalid --unified
46 46
47 47 $ hg diff --nodates -U foo
48 48 abort: diff context lines count must be an integer, not 'foo'
49 49 [255]
50 50
51 51
52 52 $ hg diff --nodates -U 2
53 53 diff -r cf9f4ba66af2 a
54 54 --- a/a
55 55 +++ b/a
56 56 @@ -3,5 +3,5 @@
57 57 a
58 58 a
59 59 -b
60 60 +dd
61 61 a
62 62 a
63 63
64 64 $ hg --config diff.unified=2 diff --nodates
65 65 diff -r cf9f4ba66af2 a
66 66 --- a/a
67 67 +++ b/a
68 68 @@ -3,5 +3,5 @@
69 69 a
70 70 a
71 71 -b
72 72 +dd
73 73 a
74 74 a
75 75
76 76 $ hg diff --nodates -U 1
77 77 diff -r cf9f4ba66af2 a
78 78 --- a/a
79 79 +++ b/a
80 80 @@ -4,3 +4,3 @@
81 81 a
82 82 -b
83 83 +dd
84 84 a
85 85
86 86 invalid diff.unified
87 87
88 88 $ hg --config diff.unified=foo diff --nodates
89 89 abort: diff context lines count must be an integer, not 'foo'
90 90 [255]
91 91
92 92 noprefix config and option
93 93
94 94 $ hg --config diff.noprefix=True diff --nodates
95 95 diff -r cf9f4ba66af2 a
96 96 --- a
97 97 +++ a
98 98 @@ -2,7 +2,7 @@
99 99 c
100 100 a
101 101 a
102 102 -b
103 103 +dd
104 104 a
105 105 a
106 106 c
107 107 $ hg diff --noprefix --nodates
108 108 diff -r cf9f4ba66af2 a
109 109 --- a
110 110 +++ a
111 111 @@ -2,7 +2,7 @@
112 112 c
113 113 a
114 114 a
115 115 -b
116 116 +dd
117 117 a
118 118 a
119 119 c
120 120
121 121 noprefix config disabled in plain mode, but option still enabled
122 122
123 123 $ HGPLAIN=1 hg --config diff.noprefix=True diff --nodates
124 124 diff -r cf9f4ba66af2 a
125 125 --- a/a
126 126 +++ b/a
127 127 @@ -2,7 +2,7 @@
128 128 c
129 129 a
130 130 a
131 131 -b
132 132 +dd
133 133 a
134 134 a
135 135 c
136 136 $ HGPLAIN=1 hg diff --noprefix --nodates
137 137 diff -r cf9f4ba66af2 a
138 138 --- a
139 139 +++ a
140 140 @@ -2,7 +2,7 @@
141 141 c
142 142 a
143 143 a
144 144 -b
145 145 +dd
146 146 a
147 147 a
148 148 c
149 149
150 150 $ cd ..
151 151
152 152
153 153 0 lines of context hunk header matches gnu diff hunk header
154 154
155 155 $ hg init diffzero
156 156 $ cd diffzero
157 157 $ cat > f1 << EOF
158 158 > c2
159 159 > c4
160 160 > c5
161 161 > EOF
162 162 $ hg commit -Am0
163 163 adding f1
164 164
165 165 $ cat > f2 << EOF
166 166 > c1
167 167 > c2
168 168 > c3
169 169 > c4
170 170 > EOF
171 171 $ mv f2 f1
172 172 $ hg diff -U0 --nodates
173 173 diff -r 55d8ff78db23 f1
174 174 --- a/f1
175 175 +++ b/f1
176 176 @@ -0,0 +1,1 @@
177 177 +c1
178 178 @@ -1,0 +3,1 @@
179 179 +c3
180 180 @@ -3,1 +4,0 @@
181 181 -c5
182 182
183 183 $ hg diff -U0 --nodates --git
184 184 diff --git a/f1 b/f1
185 185 --- a/f1
186 186 +++ b/f1
187 187 @@ -0,0 +1,1 @@
188 188 +c1
189 189 @@ -1,0 +3,1 @@
190 190 +c3
191 191 @@ -3,1 +4,0 @@
192 192 -c5
193 193
194 194 $ hg diff -U0 --nodates -p
195 195 diff -r 55d8ff78db23 f1
196 196 --- a/f1
197 197 +++ b/f1
198 198 @@ -0,0 +1,1 @@
199 199 +c1
200 200 @@ -1,0 +3,1 @@ c2
201 201 +c3
202 202 @@ -3,1 +4,0 @@ c4
203 203 -c5
204 204
205 205 $ echo a > f1
206 206 $ hg ci -m movef2
207 207
208 208 Test diff headers terminating with TAB when necessary (issue3357)
209 209 Regular diff --nodates, file creation
210 210
211 211 $ hg mv f1 'f 1'
212 212 $ echo b > 'f 1'
213 213 $ hg diff --nodates 'f 1'
214 214 diff -r 7574207d0d15 f 1
215 215 --- /dev/null
216 216 +++ b/f 1
217 217 @@ -0,0 +1,1 @@
218 218 +b
219 219
220 220 Git diff, adding space
221 221
222 222 $ hg diff --git
223 223 diff --git a/f1 b/f 1
224 224 rename from f1
225 225 rename to f 1
226 226 --- a/f1
227 227 +++ b/f 1
228 228 @@ -1,1 +1,1 @@
229 229 -a
230 230 +b
231 231
232 232 Git diff, adding extended headers
233 233
234 234 $ hg diff --git --config experimental.extendedheader.index=7 --config experimental.extendedheader.similarity=True
235 235 diff --git a/f1 b/f 1
236 236 similarity index 0%
237 237 rename from f1
238 238 rename to f 1
239 239 index 7898192..6178079 100644
240 240 --- a/f1
241 241 +++ b/f 1
242 242 @@ -1,1 +1,1 @@
243 243 -a
244 244 +b
245 245
246 $ hg diff --git --config experimental.extendedheader.index=-1
247 invalid length for extendedheader.index: '-1'
248 diff --git a/f1 b/f 1
249 rename from f1
250 rename to f 1
251 --- a/f1
252 +++ b/f 1
253 @@ -1,1 +1,1 @@
254 -a
255 +b
256
257 $ hg diff --git --config experimental.extendedheader.index=whatever
258 invalid value for extendedheader.index: 'whatever'
259 diff --git a/f1 b/f 1
260 rename from f1
261 rename to f 1
262 --- a/f1
263 +++ b/f 1
264 @@ -1,1 +1,1 @@
265 -a
266 +b
267
246 268 Git diff with noprefix
247 269
248 270 $ hg --config diff.noprefix=True diff --git --nodates
249 271 diff --git f1 f 1
250 272 rename from f1
251 273 rename to f 1
252 274 --- f1
253 275 +++ f 1
254 276 @@ -1,1 +1,1 @@
255 277 -a
256 278 +b
257 279
258 280 diff.noprefix config is ignored in plain mode (HGPLAIN), but the --noprefix option still takes effect
259 281
260 282 $ HGPLAIN=1 hg --config diff.noprefix=True diff --git --nodates
261 283 diff --git a/f1 b/f 1
262 284 rename from f1
263 285 rename to f 1
264 286 --- a/f1
265 287 +++ b/f 1
266 288 @@ -1,1 +1,1 @@
267 289 -a
268 290 +b
269 291 $ HGPLAIN=1 hg diff --git --noprefix --nodates
270 292 diff --git f1 f 1
271 293 rename from f1
272 294 rename to f 1
273 295 --- f1
274 296 +++ f 1
275 297 @@ -1,1 +1,1 @@
276 298 -a
277 299 +b
278 300
279 301 Regular diff --nodates, file deletion
280 302
281 303 $ hg ci -m addspace
282 304 $ hg mv 'f 1' f1
283 305 $ echo a > f1
284 306 $ hg diff --nodates 'f 1'
285 307 diff -r ca50fe67c9c7 f 1
286 308 --- a/f 1
287 309 +++ /dev/null
288 310 @@ -1,1 +0,0 @@
289 311 -b
290 312
291 313 Git diff, removing space
292 314
293 315 $ hg diff --git
294 316 diff --git a/f 1 b/f1
295 317 rename from f 1
296 318 rename to f1
297 319 --- a/f 1
298 320 +++ b/f1
299 321 @@ -1,1 +1,1 @@
300 322 -b
301 323 +a
302 324
303 325 showfunc diff
304 326 $ cat > f1 << EOF
305 327 > int main() {
306 328 > int a = 0;
307 329 > int b = 1;
308 330 > int c = 2;
309 331 > int d = 3;
310 332 > return a + b + c + d;
311 333 > }
312 334 > EOF
313 335 $ hg commit -m addfunction
314 336 $ cat > f1 << EOF
315 337 > int main() {
316 338 > int a = 0;
317 339 > int b = 1;
318 340 > int c = 2;
319 341 > int e = 3;
320 342 > return a + b + c + e;
321 343 > }
322 344 > EOF
323 345 $ hg diff --git
324 346 diff --git a/f1 b/f1
325 347 --- a/f1
326 348 +++ b/f1
327 349 @@ -2,6 +2,6 @@
328 350 int a = 0;
329 351 int b = 1;
330 352 int c = 2;
331 353 - int d = 3;
332 354 - return a + b + c + d;
333 355 + int e = 3;
334 356 + return a + b + c + e;
335 357 }
336 358 $ hg diff --config diff.showfunc=True --git
337 359 diff --git a/f1 b/f1
338 360 --- a/f1
339 361 +++ b/f1
340 362 @@ -2,6 +2,6 @@ int main() {
341 363 int a = 0;
342 364 int b = 1;
343 365 int c = 2;
344 366 - int d = 3;
345 367 - return a + b + c + d;
346 368 + int e = 3;
347 369 + return a + b + c + e;
348 370 }
349 371
350 372 If [diff] git is set to true, but the user says --no-git, we should
351 373 *not* get git diffs
352 374 $ hg diff --nodates --config diff.git=1 --no-git
353 375 diff -r f2c7c817fa55 f1
354 376 --- a/f1
355 377 +++ b/f1
356 378 @@ -2,6 +2,6 @@
357 379 int a = 0;
358 380 int b = 1;
359 381 int c = 2;
360 382 - int d = 3;
361 383 - return a + b + c + d;
362 384 + int e = 3;
363 385 + return a + b + c + e;
364 386 }
365 387
366 388 $ cd ..
General Comments 0
You need to be logged in to leave comments. Login now