##// END OF EJS Templates
patch: stop modifying gitpatch objects...
Patrick Mezard -
r14389:909ac6b9 default
parent child Browse files
Show More
@@ -1,1783 +1,1778 b''
1 1 # patch.py - patch file parsing routines
2 2 #
3 3 # Copyright 2006 Brendan Cully <brendan@kublai.com>
4 4 # Copyright 2007 Chris Mason <chris.mason@oracle.com>
5 5 #
6 6 # This software may be used and distributed according to the terms of the
7 7 # GNU General Public License version 2 or any later version.
8 8
9 9 import cStringIO, email.Parser, os, errno, re
10 10 import tempfile, zlib
11 11
12 12 from i18n import _
13 13 from node import hex, nullid, short
14 14 import base85, mdiff, scmutil, util, diffhelpers, copies, encoding
15 15
# Matches a git extended diff header line ("diff --git a/<old> b/<new>"),
# capturing the path after "a/" as group 1 and the path after "b/" as group 2.
gitre = re.compile('diff --git a/(.*) b/(.*)')
17 17
class PatchError(Exception):
    """Raised when a patch cannot be parsed or a path cannot be stripped."""
20 20
21 21
22 22 # public functions
23 23
def split(stream):
    '''return an iterator of individual patches from a stream

    stream is iterated line by line (or wrapped so that it can be, if it
    only provides readline). The first lines are inspected to pick a
    splitting strategy:

    - a "# HG changeset patch" line selects hgsplit
    - a line starting with "From " selects mboxsplit
    - a "content-type" header selects mimesplit
    - a "--- " line seen after header-like lines selects headersplit
    - otherwise the whole input is returned as a single patch

    Every yielded item is a cStringIO file object.
    '''
    def isheader(line, inheader):
        # Tell whether line looks like an RFC822-style "Name: value"
        # header. inheader says whether the previous line was a header,
        # in which case an indented line counts as its continuation.
        if inheader and line[0] in (' ', '\t'):
            # continuation
            return True
        if line[0] in (' ', '-', '+'):
            # diff line - don't check for header pattern in there
            return False
        l = line.split(': ', 1)
        return len(l) == 2 and ' ' not in l[0]

    def chunk(lines):
        # Wrap the accumulated lines in a file-like object
        return cStringIO.StringIO(''.join(lines))

    def hgsplit(stream, cur):
        # Split on "# HG changeset patch" markers. cur holds the lines
        # already consumed by the caller (including the first marker).
        inheader = True

        for line in stream:
            if not line.strip():
                # a blank line ends the current header
                inheader = False
            if not inheader and line.startswith('# HG changeset patch'):
                yield chunk(cur)
                cur = []
                inheader = True

            cur.append(line)

        if cur:
            yield chunk(cur)

    def mboxsplit(stream, cur):
        # Split on mbox "From " separator lines. Each message, minus its
        # first line (cur[1:]), is split again recursively.
        for line in stream:
            if line.startswith('From '):
                for c in split(chunk(cur[1:])):
                    yield c
                cur = []

            cur.append(line)

        if cur:
            for c in split(chunk(cur[1:])):
                yield c

    def mimesplit(stream, cur):
        # Read the rest of the stream, parse it as an email message and
        # yield either the whole message (not multipart) or each part
        # whose content type is listed in ok_types.
        def msgfp(m):
            # Serialize message m into a rewound file-like object
            fp = cStringIO.StringIO()
            g = email.Generator.Generator(fp, mangle_from_=False)
            g.flatten(m)
            fp.seek(0)
            return fp

        for line in stream:
            cur.append(line)
        c = chunk(cur)

        m = email.Parser.Parser().parse(c)
        if not m.is_multipart():
            yield msgfp(m)
        else:
            ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
            for part in m.walk():
                ct = part.get_content_type()
                if ct not in ok_types:
                    continue
                yield msgfp(part)

    def headersplit(stream, cur):
        # Split whenever a new block of header-like lines starts after
        # non-header content.
        inheader = False

        for line in stream:
            if not inheader and isheader(line, inheader):
                yield chunk(cur)
                cur = []
                inheader = True
            if inheader and not isheader(line, inheader):
                inheader = False

            cur.append(line)

        if cur:
            yield chunk(cur)

    def remainder(cur):
        # Everything that was read forms a single patch
        yield chunk(cur)

    class fiter(object):
        # Adapter turning an object with readline() into a (Python 2)
        # iterator over its lines; iteration stops on an empty read.
        def __init__(self, fp):
            self.fp = fp

        def __iter__(self):
            return self

        def next(self):
            l = self.fp.readline()
            if not l:
                raise StopIteration
            return l

    inheader = False
    cur = []

    mimeheaders = ['content-type']

    if not hasattr(stream, 'next'):
        # http responses, for example, have readline but not next
        stream = fiter(stream)

    # Sniff the input. The selected generator receives the same,
    # partially consumed, stream together with the lines read so far.
    for line in stream:
        cur.append(line)
        if line.startswith('# HG changeset patch'):
            return hgsplit(stream, cur)
        elif line.startswith('From '):
            return mboxsplit(stream, cur)
        elif isheader(line, inheader):
            inheader = True
            if line.split(':', 1)[0].lower() in mimeheaders:
                # let email parser handle this
                return mimesplit(stream, cur)
        elif line.startswith('--- ') and inheader:
            # No evil headers seen by diff start, split by hand
            return headersplit(stream, cur)
        # Not enough info, keep reading

    # if we are here, we have a very plain patch
    return remainder(cur)
150 150
def extract(ui, fileobj):
    '''extract patch from data read from fileobj.

    patch can be a normal patch or contained in an email message.

    The input is parsed as an email message. Every part with a content
    type of text/plain, text/x-diff or text/x-patch is searched for the
    start of a diff; the text preceding the diff is used as the commit
    message, and "# HG changeset patch" header lines found there provide
    user, date, branch, node and parents. The payload of each part
    containing a diff is written to a temporary file.

    ui is only used for its debug() method.

    return tuple (filename, message, user, date, branch, node, p1, p2).
    Any item in the returned tuple can be None. If filename is None,
    fileobj did not contain a patch. Caller must unlink filename when done.'''

    # attempt to detect the start of a patch
    # (this heuristic is borrowed from quilt)
    diffre = re.compile(r'^(?:Index:[ \t]|diff[ \t]|RCS file: |'
                        r'retrieving revision [0-9]+(\.[0-9]+)*$|'
                        r'---[ \t].*?^\+\+\+[ \t]|'
                        r'\*\*\*[ \t].*?^---[ \t])', re.MULTILINE|re.DOTALL)

    fd, tmpname = tempfile.mkstemp(prefix='hg-patch-')
    tmpfp = os.fdopen(fd, 'w')
    try:
        msg = email.Parser.Parser().parse(fileobj)

        subject = msg['Subject']
        user = msg['From']
        if not subject and not user:
            # Not an email, restore parsed headers if any
            subject = '\n'.join(': '.join(h) for h in msg.items()) + '\n'

        gitsendmail = 'git-send-email' in msg.get('X-Mailer', '')
        # should try to parse msg['Date']
        date = None
        nodeid = None
        branch = None
        parents = []

        if subject:
            if subject.startswith('[PATCH'):
                # drop the leading "[PATCH ...]" tag
                pend = subject.find(']')
                if pend >= 0:
                    subject = subject[pend + 1:].lstrip()
            # unfold a subject continued on a tab-indented line
            subject = subject.replace('\n\t', ' ')
            ui.debug('Subject: %s\n' % subject)
        if user:
            ui.debug('From: %s\n' % user)
        diffs_seen = 0
        ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
        message = ''
        for part in msg.walk():
            content_type = part.get_content_type()
            ui.debug('Content-Type: %s\n' % content_type)
            if content_type not in ok_types:
                continue
            payload = part.get_payload(decode=True)
            m = diffre.search(payload)
            if m:
                hgpatch = False
                hgpatchheader = False
                ignoretext = False

                ui.debug('found patch at byte %d\n' % m.start(0))
                diffs_seen += 1
                cfp = cStringIO.StringIO()
                # everything before the diff is commit message and/or
                # "hg export" header
                for line in payload[:m.start(0)].splitlines():
                    if line.startswith('# HG changeset patch') and not hgpatch:
                        ui.debug('patch generated by hg export\n')
                        hgpatch = True
                        hgpatchheader = True
                        # drop earlier commit message content
                        cfp.seek(0)
                        cfp.truncate()
                        subject = None
                    elif hgpatchheader:
                        if line.startswith('# User '):
                            user = line[7:]
                            ui.debug('From: %s\n' % user)
                        elif line.startswith("# Date "):
                            date = line[7:]
                        elif line.startswith("# Branch "):
                            branch = line[9:]
                        elif line.startswith("# Node ID "):
                            nodeid = line[10:]
                        elif line.startswith("# Parent "):
                            # The matched prefix is 9 characters long;
                            # strip whatever whitespace follows it so the
                            # hash is kept whole whether "Parent" is
                            # followed by one space or by two.
                            parents.append(line[9:].lstrip())
                        elif not line.startswith("# "):
                            hgpatchheader = False
                    elif line == '---' and gitsendmail:
                        # git-send-email puts diffstat after a '---' line
                        ignoretext = True
                    if not hgpatchheader and not ignoretext:
                        cfp.write(line)
                        cfp.write('\n')
                message = cfp.getvalue()
                tmpfp.write(payload)
                if not payload.endswith('\n'):
                    tmpfp.write('\n')
            elif not diffs_seen and message and content_type == 'text/plain':
                message += '\n' + payload
    except:
        # whatever went wrong (interrupts included), do not leave the
        # temporary file behind, then let the error propagate
        tmpfp.close()
        os.unlink(tmpname)
        raise

    if subject and not message.startswith(subject):
        message = '%s\n%s' % (subject, message)
    tmpfp.close()
    if not diffs_seen:
        os.unlink(tmpname)
        return None, message, user, date, branch, None, None, None
    # first and second parent, None when absent
    p1 = parents and parents.pop(0) or None
    p2 = parents and parents.pop(0) or None
    return tmpname, message, user, date, branch, nodeid, p1, p2
261 261
class patchmeta(object):
    """Metadata about one file touched by a patch.

    'path' is the patched file path and 'op' the operation performed on
    it: one of ADD, DELETE, RENAME, MODIFY (the initial value) or COPY.
    'oldpath' is the origin file for COPY and RENAME and None otherwise.
    'mode' stays None unless setmode() was called, in which case it is
    an (islink, isexec) tuple whose items are truthy when the file is a
    symlink / is executable. 'binary' starts out False.
    """
    def __init__(self, path):
        self.op = 'MODIFY'
        self.path = path
        self.oldpath = None
        self.binary = False
        self.mode = None

    def setmode(self, mode):
        """Record the symlink and exec bits of the integer file mode."""
        # 0x2000 is octal 020000, 0x40 is octal 0100
        linkbit = mode & 0x2000
        execbit = mode & 0x40
        self.mode = (linkbit, execbit)

    def __repr__(self):
        described = (self.op, self.path)
        return "<patchmeta %s %r>" % described
286 286
def readgitpatch(lr):
    """Collect git extended header metadata from the patch lines in lr.

    lr is iterated line by line. A patchmeta is started for every
    "diff --git a/... b/..." line and filled in from the extended header
    lines following it, up to the next "diff --git" line, a "--- " line
    or the end of input. The patchmeta objects are returned as a list,
    in order of appearance.
    """
    collected = []
    current = None
    for rawline in lr:
        text = rawline.rstrip(' \r\n')
        if text.startswith('diff --git'):
            found = gitre.match(text)
            if found:
                # a new file section begins, flush the pending one
                if current:
                    collected.append(current)
                current = patchmeta(found.group(2))
            continue
        if not current:
            # not inside a git header, nothing to record
            continue
        if text.startswith('--- '):
            # the hunks start here: the extended header is over
            collected.append(current)
            current = None
        elif text.startswith('rename from '):
            current.op = 'RENAME'
            current.oldpath = text[12:]
        elif text.startswith('rename to '):
            current.path = text[10:]
        elif text.startswith('copy from '):
            current.op = 'COPY'
            current.oldpath = text[10:]
        elif text.startswith('copy to '):
            current.path = text[8:]
        elif text.startswith('deleted file'):
            current.op = 'DELETE'
        elif text.startswith('new file mode '):
            current.op = 'ADD'
            # the mode is the trailing six octal digits
            current.setmode(int(text[-6:], 8))
        elif text.startswith('new mode '):
            current.setmode(int(text[-6:], 8))
        elif text.startswith('GIT binary patch'):
            current.binary = True
    if current:
        collected.append(current)

    return collected
330 330
class linereader(object):
    """Read lines from fp, allowing lines to be pushed back.

    Pushed lines are returned, first pushed first, before anything else
    is read from fp. 'eol' records the line ending ('\\r\\n' or '\\n') of
    the first line read from fp which has one. With textmode set, a
    trailing CRLF is converted to LF on lines read from fp.
    """
    def __init__(self, fp, textmode=False):
        self.fp = fp
        self.textmode = textmode
        self.eol = None
        self.buf = []

    def push(self, line):
        # None is silently ignored
        if line is None:
            return
        self.buf.append(line)

    def readline(self):
        if self.buf:
            # pushed back lines are returned untouched
            return self.buf.pop(0)
        line = self.fp.readline()
        crlf = line.endswith('\r\n')
        if not self.eol:
            if crlf:
                self.eol = '\r\n'
            elif line.endswith('\n'):
                self.eol = '\n'
        if crlf and self.textmode:
            return line[:-2] + '\n'
        return line

    def __iter__(self):
        # stop on the first empty read
        line = self.readline()
        while line:
            yield line
            line = self.readline()
364 364
class abstractbackend(object):
    """Interface of the objects used to read and write patched files.

    Apart from writerej(), which does nothing, every operation raises
    NotImplementedError and has to be provided by subclasses.
    """
    def __init__(self, ui):
        self.ui = ui

    def readlines(self, fname):
        """Return target file lines, or its content as a single line
        for symlinks.
        """
        raise NotImplementedError

    def writelines(self, fname, lines, mode):
        """Write lines to target file. mode is a (islink, isexec)
        tuple, or None if there is no mode information.
        """
        raise NotImplementedError

    def unlink(self, fname):
        """Unlink target file."""
        raise NotImplementedError

    def writerej(self, fname, failed, total, lines):
        """Write rejected lines for fname. failed is the number of hunks
        which failed to apply and total the total number of hunks for this
        file.
        """
        pass

    def copy(self, src, dst):
        """Copy src file into dst file. Create intermediate directories if
        necessary. Files are specified relatively to the patching base
        directory.
        """
        raise NotImplementedError

    def exists(self, fname):
        """Tell whether target file exists."""
        raise NotImplementedError

    def setmode(self, fname, islink, isexec):
        """Change target file mode."""
        raise NotImplementedError
405 405
406 406 class fsbackend(abstractbackend):
407 407 def __init__(self, ui, basedir):
408 408 super(fsbackend, self).__init__(ui)
409 409 self.opener = scmutil.opener(basedir)
410 410
411 411 def _join(self, f):
412 412 return os.path.join(self.opener.base, f)
413 413
414 414 def readlines(self, fname):
415 415 if os.path.islink(self._join(fname)):
416 416 return [os.readlink(self._join(fname))]
417 417 fp = self.opener(fname, 'r')
418 418 try:
419 419 return list(fp)
420 420 finally:
421 421 fp.close()
422 422
423 423 def writelines(self, fname, lines, mode):
424 424 if not mode:
425 425 # Preserve mode information
426 426 isexec, islink = False, False
427 427 try:
428 428 isexec = os.lstat(self._join(fname)).st_mode & 0100 != 0
429 429 islink = os.path.islink(self._join(fname))
430 430 except OSError, e:
431 431 if e.errno != errno.ENOENT:
432 432 raise
433 433 else:
434 434 islink, isexec = mode
435 435 if islink:
436 436 self.opener.symlink(''.join(lines), fname)
437 437 else:
438 438 self.opener(fname, 'w').writelines(lines)
439 439 if isexec:
440 440 util.setflags(self._join(fname), False, True)
441 441
442 442 def unlink(self, fname):
443 443 try:
444 444 util.unlinkpath(self._join(fname))
445 445 except OSError, inst:
446 446 if inst.errno != errno.ENOENT:
447 447 raise
448 448
449 449 def writerej(self, fname, failed, total, lines):
450 450 fname = fname + ".rej"
451 451 self.ui.warn(
452 452 _("%d out of %d hunks FAILED -- saving rejects to file %s\n") %
453 453 (failed, total, fname))
454 454 fp = self.opener(fname, 'w')
455 455 fp.writelines(lines)
456 456 fp.close()
457 457
458 458 def copy(self, src, dst):
459 459 basedir = self.opener.base
460 460 abssrc, absdst = [scmutil.canonpath(basedir, basedir, x)
461 461 for x in [src, dst]]
462 462 if os.path.lexists(absdst):
463 463 raise util.Abort(_("cannot create %s: destination already exists")
464 464 % dst)
465 465 dstdir = os.path.dirname(absdst)
466 466 if dstdir and not os.path.isdir(dstdir):
467 467 try:
468 468 os.makedirs(dstdir)
469 469 except IOError:
470 470 raise util.Abort(
471 471 _("cannot create %s: unable to create destination directory")
472 472 % dst)
473 473 util.copyfile(abssrc, absdst)
474 474
475 475 def exists(self, fname):
476 476 return os.path.lexists(self._join(fname))
477 477
478 478 def setmode(self, fname, islink, isexec):
479 479 util.setflags(self._join(fname), islink, isexec)
480 480
class workingbackend(fsbackend):
    """fsbackend rooted at repo.root which remembers what it touched.

    Written, removed and copied files are recorded while patching;
    close() hands them over to the repository.
    """
    def __init__(self, ui, repo, similarity):
        super(workingbackend, self).__init__(ui, repo.root)
        self.repo = repo
        self.similarity = similarity
        self.changed = set()
        self.removed = set()
        self.copied = []

    def writelines(self, fname, lines, mode):
        super(workingbackend, self).writelines(fname, lines, mode)
        self.changed.add(fname)

    def unlink(self, fname):
        super(workingbackend, self).unlink(fname)
        # a removed file is also a changed one
        for bucket in (self.removed, self.changed):
            bucket.add(fname)

    def copy(self, src, dst):
        super(workingbackend, self).copy(src, dst)
        self.copied.append((src, dst))
        self.changed.add(dst)

    def setmode(self, fname, islink, isexec):
        super(workingbackend, self).setmode(fname, islink, isexec)
        self.changed.add(fname)

    def close(self):
        """Record copies, removals and add/removes in the repository
        and return the sorted list of changed files.
        """
        wctx = self.repo[None]
        pending = set(self.changed)
        for source, dest in self.copied:
            scmutil.dirstatecopy(self.ui, self.repo, wctx, source, dest)
            pending.discard(source)
        if self.removed and not self.similarity:
            wctx.remove(sorted(self.removed))
        if pending:
            cwd = self.repo.getcwd()
            if cwd:
                # scmutil.addremove is given paths relative to cwd
                root = self.repo.root
                pending = [util.pathto(root, cwd, f) for f in pending]
            scmutil.addremove(self.repo, pending, similarity=self.similarity)
        return sorted(self.changed)
523 523
# Unified hunk header:
# @@ -start,len +start,len @@ or @@ -start +start @@ if len is 1
# Groups 1 and 4 are the start lines, groups 3 and 6 the optional lengths.
unidesc = re.compile('@@ -(\d+)(,(\d+))? \+(\d+)(,(\d+))? @@')
# Context diff range line: "*** start,end ***" or "--- start,end ---",
# where ",end" is optional. Group 2 is the start, group 4 the end.
contextdesc = re.compile('(---|\*\*\*) (\d+)(,(\d+))? (---|\*\*\*)')
# End-of-line handling modes; patchfile's eolmode takes these values.
eolmodes = ['strict', 'crlf', 'lf', 'auto']
528 528
class patchfile(object):
    """One target file being patched.

    The file content is read through the backend and kept in memory as
    a list of lines; apply() modifies that list one hunk at a time and
    close() writes the result, and the rejected hunks if any, back
    through the backend.
    """
    def __init__(self, ui, fname, backend, mode, missing=False,
                 eolmode='strict'):
        # fname: path handed to the backend
        # mode: passed as is to backend.writelines() on close()
        # missing: the target is known not to exist, every hunk will be
        #          rejected
        # eolmode: how line endings are handled, see writelines()
        self.fname = fname
        self.eolmode = eolmode
        self.eol = None
        self.backend = backend
        self.ui = ui
        self.lines = []
        self.exists = False
        self.missing = missing
        self.mode = mode
        if not missing:
            try:
                self.lines = self.backend.readlines(fname)
                if self.lines:
                    # Normalize line endings
                    # (the first line decides the file eol)
                    if self.lines[0].endswith('\r\n'):
                        self.eol = '\r\n'
                    elif self.lines[0].endswith('\n'):
                        self.eol = '\n'
                    if eolmode != 'strict':
                        nlines = []
                        for l in self.lines:
                            if l.endswith('\r\n'):
                                l = l[:-2] + '\n'
                            nlines.append(l)
                        self.lines = nlines
                self.exists = True
            except IOError:
                # unreadable target: exists stays False
                pass
        else:
            self.ui.warn(_("unable to find '%s' for patching\n") % self.fname)

        # line content -> list of line indexes, rebuilt by apply() when
        # a hunk does not apply at its expected position
        self.hash = {}
        self.dirty = 0
        # difference in line count introduced by the hunks applied so far
        self.offset = 0
        # distance between the expected and actual position of the last
        # hunk applied through the offset/fuzz search
        self.skew = 0
        # hunks which could not be applied
        self.rej = []
        self.fileprinted = False
        self.printfile(False)
        # number of hunks seen by apply()
        self.hunks = 0

    def writelines(self, fname, lines, mode):
        """Write lines through the backend, converting LF line endings
        to the eol selected by eolmode unless it is 'strict'.
        """
        if self.eolmode == 'auto':
            eol = self.eol
        elif self.eolmode == 'crlf':
            eol = '\r\n'
        else:
            eol = '\n'

        if self.eolmode != 'strict' and eol and eol != '\n':
            rawlines = []
            for l in lines:
                if l and l[-1] == '\n':
                    l = l[:-1] + eol
                rawlines.append(l)
            lines = rawlines

        self.backend.writelines(fname, lines, mode)

    def printfile(self, warn):
        """Print the "patching file" message, at most once: as a
        warning if warn is set, as a note in verbose mode otherwise.
        """
        if self.fileprinted:
            return
        if warn or self.ui.verbose:
            self.fileprinted = True
        s = _("patching file %s\n") % self.fname
        if warn:
            self.ui.warn(s)
        else:
            self.ui.note(s)


    def findlines(self, l, linenum):
        # looks through the hash and finds candidate lines.  The
        # result is a list of line numbers sorted based on distance
        # from linenum

        cand = self.hash.get(l, [])
        if len(cand) > 1:
            # resort our list of potentials forward then back.
            cand.sort(key=lambda x: abs(x - linenum))
        return cand

    def write_rej(self):
        # our rejects are a little different from patch(1).  This always
        # creates rejects in the same form as the original patch.  A file
        # header is inserted so that you can run the reject through patch again
        # without having to type the filename.
        if not self.rej:
            return
        base = os.path.basename(self.fname)
        lines = ["--- %s\n+++ %s\n" % (base, base)]
        for x in self.rej:
            for l in x.hunk:
                lines.append(l)
                if l[-1] != '\n':
                    lines.append("\n\ No newline at end of file\n")
        self.backend.writerej(self.fname, len(self.rej), self.hunks, lines)

    def apply(self, h):
        """Apply hunk h to the in-memory lines.

        Return 0 if the hunk applied at its expected position, the fuzz
        level used if it applied elsewhere, and -1 if it was rejected.
        Raise PatchError if the hunk is incomplete.
        """
        if not h.complete():
            raise PatchError(_("bad hunk #%d %s (%d %d %d %d)") %
                            (h.number, h.desc, len(h.a), h.lena, len(h.b),
                            h.lenb))

        self.hunks += 1

        if self.missing:
            self.rej.append(h)
            return -1

        if self.exists and h.createfile():
            self.ui.warn(_("file %s already exists\n") % self.fname)
            self.rej.append(h)
            return -1

        if isinstance(h, binhunk):
            # binary hunks replace the whole content, or remove the file
            if h.rmfile():
                self.backend.unlink(self.fname)
            else:
                self.lines[:] = h.new()
                self.offset += len(h.new())
                self.dirty = True
            return 0

        # keep the unmodified hunk around: it is the one saved on reject
        horig = h
        if (self.eolmode in ('crlf', 'lf')
            or self.eolmode == 'auto' and self.eol):
            # If new eols are going to be normalized, then normalize
            # hunk data before patching. Otherwise, preserve input
            # line-endings.
            h = h.getnormalized()

        # fast case first, no offsets, no fuzz
        old = h.old()
        # patch starts counting at 1 unless we are adding the file
        if h.starta == 0:
            start = 0
        else:
            start = h.starta + self.offset - 1
        orig_start = start
        # if there's skew we want to emit the "(offset %d lines)" even
        # when the hunk cleanly applies at start + skew, so skip the
        # fast case code
        if self.skew == 0 and diffhelpers.testhunk(old, self.lines, start) == 0:
            if h.rmfile():
                self.backend.unlink(self.fname)
            else:
                self.lines[start : start + h.lena] = h.new()
                self.offset += h.lenb - h.lena
                self.dirty = True
            return 0

        # ok, we couldn't match the hunk.  Lets look for offsets and fuzz it
        self.hash = {}
        for x, s in enumerate(self.lines):
            self.hash.setdefault(s, []).append(x)
        if h.hunk[-1][0] != ' ':
            # if the hunk tried to put something at the bottom of the file
            # override the start line and use eof here
            search_start = len(self.lines)
        else:
            search_start = orig_start + self.skew

        # try with no fuzz first, then with one and two context lines
        # dropped: from the top only, then from both ends
        for fuzzlen in xrange(3):
            for toponly in [True, False]:
                old = h.old(fuzzlen, toponly)

                # candidate positions are the lines equal to the first
                # old line, closest to search_start first
                cand = self.findlines(old[0][1:], search_start)
                for l in cand:
                    if diffhelpers.testhunk(old, self.lines, l) == 0:
                        newlines = h.new(fuzzlen, toponly)
                        self.lines[l : l + len(old)] = newlines
                        self.offset += len(newlines) - len(old)
                        self.skew = l - orig_start
                        self.dirty = True
                        offset = l - orig_start - fuzzlen
                        if fuzzlen:
                            msg = _("Hunk #%d succeeded at %d "
                                    "with fuzz %d "
                                    "(offset %d lines).\n")
                            self.printfile(True)
                            self.ui.warn(msg %
                                (h.number, l + 1, fuzzlen, offset))
                        else:
                            msg = _("Hunk #%d succeeded at %d "
                                    "(offset %d lines).\n")
                            self.ui.note(msg % (h.number, l + 1, offset))
                        return fuzzlen
        self.printfile(True)
        self.ui.warn(_("Hunk #%d FAILED at %d\n") % (h.number, orig_start))
        self.rej.append(horig)
        return -1

    def close(self):
        """Write the patched content if it changed, then the rejects.
        Return the number of rejected hunks.
        """
        if self.dirty:
            self.writelines(self.fname, self.lines, self.mode)
        self.write_rej()
        return len(self.rej)
729 729
class hunk(object):
    """One hunk of a unified or context diff.

    'hunk' holds the hunk lines in unified format, starting with the
    description line. 'a' and 'b' are the old and new line lists,
    'starta'/'lena' and 'startb'/'lenb' the ranges read from the
    description.
    """
    def __init__(self, desc, num, lr, context, create=False, remove=False):
        # desc: hunk description line
        # num: hunk number, used in messages
        # lr: line reader positioned after desc, or None to build an
        #     empty hunk (see getnormalized())
        # context: true for a context diff, false for a unified one
        self.number = num
        self.desc = desc
        self.hunk = [desc]
        self.a = []
        self.b = []
        self.starta = self.lena = None
        self.startb = self.lenb = None
        if lr is not None:
            if context:
                self.read_context_hunk(lr)
            else:
                self.read_unified_hunk(lr)
        self.create = create
        # creation wins over removal
        self.remove = remove and not create

    def getnormalized(self):
        """Return a copy with line endings normalized to LF."""

        def normalize(lines):
            nlines = []
            for line in lines:
                if line.endswith('\r\n'):
                    line = line[:-2] + '\n'
                nlines.append(line)
            return nlines

        # Dummy object, it is rebuilt manually
        nh = hunk(self.desc, self.number, None, None, False, False)
        nh.number = self.number
        nh.desc = self.desc
        # the 'hunk' list is shared with the original and not normalized
        nh.hunk = self.hunk
        nh.a = normalize(self.a)
        nh.b = normalize(self.b)
        nh.starta = self.starta
        nh.startb = self.startb
        nh.lena = self.lena
        nh.lenb = self.lenb
        nh.create = self.create
        nh.remove = self.remove
        return nh

    def read_unified_hunk(self, lr):
        """Parse the unified description line and read the hunk body
        from lr. Raise PatchError if the description is malformed.
        """
        m = unidesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.starta, foo, self.lena, self.startb, foo2, self.lenb = m.groups()
        # a missing length means one line
        if self.lena is None:
            self.lena = 1
        else:
            self.lena = int(self.lena)
        if self.lenb is None:
            self.lenb = 1
        else:
            self.lenb = int(self.lenb)
        self.starta = int(self.starta)
        self.startb = int(self.startb)
        diffhelpers.addlines(lr, self.hunk, self.lena, self.lenb, self.a, self.b)
        # if we hit eof before finishing out the hunk, the last line will
        # be zero length.  Lets try to fix it up.
        while len(self.hunk[-1]) == 0:
            del self.hunk[-1]
            del self.a[-1]
            del self.b[-1]
            self.lena -= 1
            self.lenb -= 1
        self._fixnewline(lr)

    def read_context_hunk(self, lr):
        """Read a context diff hunk from lr and convert it to unified
        form. Raise PatchError on malformed input.
        """
        # the old range line
        self.desc = lr.readline()
        m = contextdesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        foo, self.starta, foo2, aend, foo3 = m.groups()
        self.starta = int(self.starta)
        if aend is None:
            aend = self.starta
        self.lena = int(aend) - self.starta
        if self.starta:
            self.lena += 1
        # old block: "- " and "! " lines become removals
        for x in xrange(self.lena):
            l = lr.readline()
            if l.startswith('---'):
                # lines addition, old block is empty
                lr.push(l)
                break
            s = l[2:]
            if l.startswith('- ') or l.startswith('! '):
                u = '-' + s
            elif l.startswith(' '):
                u = ' ' + s
            else:
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.a.append(u)
            self.hunk.append(u)

        l = lr.readline()
        if l.startswith('\ '):
            # no-eol marker: drop the last character of the last old line
            s = self.a[-1][:-1]
            self.a[-1] = s
            self.hunk[-1] = s
            l = lr.readline()
        # the new range line
        m = contextdesc.match(l)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        foo, self.startb, foo2, bend, foo3 = m.groups()
        self.startb = int(self.startb)
        if bend is None:
            bend = self.startb
        self.lenb = int(bend) - self.startb
        if self.startb:
            self.lenb += 1
        # index in self.hunk where the next new line is looked up or
        # inserted
        hunki = 1
        # new block: "+ " and "! " lines become additions
        for x in xrange(self.lenb):
            l = lr.readline()
            if l.startswith('\ '):
                # XXX: the only way to hit this is with an invalid line range.
                # The no-eol marker is not counted in the line range, but I
                # guess there are diff(1) out there which behave differently.
                s = self.b[-1][:-1]
                self.b[-1] = s
                self.hunk[hunki - 1] = s
                continue
            if not l:
                # line deletions, new block is empty and we hit EOF
                lr.push(l)
                break
            s = l[2:]
            if l.startswith('+ ') or l.startswith('! '):
                u = '+' + s
            elif l.startswith(' '):
                u = ' ' + s
            elif len(self.b) == 0:
                # line deletions, new block is empty
                lr.push(l)
                break
            else:
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.b.append(s)
            # merge the new line into the unified hunk: skip over
            # removals, stop on an identical line, insert otherwise
            while True:
                if hunki >= len(self.hunk):
                    h = ""
                else:
                    h = self.hunk[hunki]
                hunki += 1
                if h == u:
                    break
                elif h.startswith('-'):
                    continue
                else:
                    self.hunk.insert(hunki - 1, u)
                    break

        if not self.a:
            # this happens when lines were only added to the hunk
            for x in self.hunk:
                if x.startswith('-') or x.startswith(' '):
                    self.a.append(x)
        if not self.b:
            # this happens when lines were only deleted from the hunk
            for x in self.hunk:
                if x.startswith('+') or x.startswith(' '):
                    self.b.append(x[1:])
        # @@ -start,len +start,len @@
        self.desc = "@@ -%d,%d +%d,%d @@\n" % (self.starta, self.lena,
                                             self.startb, self.lenb)
        self.hunk[0] = self.desc
        self._fixnewline(lr)

    def _fixnewline(self, lr):
        # Consume a following "\ ..." (no newline at end of file) marker
        # and let diffhelpers.fix_newline adjust the hunk; any other
        # line is pushed back.
        l = lr.readline()
        if l.startswith('\ '):
            diffhelpers.fix_newline(self.hunk, self.a, self.b)
        else:
            lr.push(l)

    def complete(self):
        """Tell whether as many old and new lines were read as the
        description announced.
        """
        return len(self.a) == self.lena and len(self.b) == self.lenb

    def createfile(self):
        """Tell whether this hunk creates its target file."""
        return self.starta == 0 and self.lena == 0 and self.create

    def rmfile(self):
        """Tell whether this hunk removes its target file."""
        return self.startb == 0 and self.lenb == 0 and self.remove

    def fuzzit(self, l, fuzz, toponly):
        # this removes context lines from the top and bottom of list 'l'.  It
        # checks the hunk to make sure only context lines are removed, and then
        # returns a new shortened list of lines.
        # (at least one line of 'l' is always kept)
        fuzz = min(fuzz, len(l)-1)
        if fuzz:
            top = 0
            bot = 0
            hlen = len(self.hunk)
            for x in xrange(hlen - 1):
                # the hunk starts with the @@ line, so use x+1
                if self.hunk[x + 1][0] == ' ':
                    top += 1
                else:
                    break
            if not toponly:
                for x in xrange(hlen - 1):
                    if self.hunk[hlen - bot - 1][0] == ' ':
                        bot += 1
                    else:
                        break

            # top and bot now count context in the hunk
            # adjust them if either one is short
            context = max(top, bot, 3)
            if bot < context:
                bot = max(0, fuzz - (context - bot))
            else:
                bot = min(fuzz, bot)
            if top < context:
                top = max(0, fuzz - (context - top))
            else:
                top = min(fuzz, top)

            return l[top:len(l)-bot]
        return l

    def old(self, fuzz=0, toponly=False):
        """Return the old lines, trimmed by fuzzit()."""
        return self.fuzzit(self.a, fuzz, toponly)

    def new(self, fuzz=0, toponly=False):
        """Return the new lines, trimmed by fuzzit()."""
        return self.fuzzit(self.b, fuzz, toponly)
960 960
class binhunk:
    'A binary patch file. Only understands literals so far.'
    def __init__(self, gitpatch, lr):
        # gitpatch: object whose 'op' attribute tells whether the file
        #           is added or deleted
        # lr: line reader positioned after the "GIT binary patch" line
        self.gitpatch = gitpatch
        # decoded file content, None until _read() succeeds
        self.text = None
        self.hunk = ['GIT binary patch\n']
        self._read(lr)

    def createfile(self):
        """Tell whether the patched file is being added."""
        return self.gitpatch.op == 'ADD'

    def rmfile(self):
        """Tell whether the patched file is being deleted."""
        return self.gitpatch.op == 'DELETE'

    def complete(self):
        """Tell whether the binary content was decoded."""
        return self.text is not None

    def new(self):
        """Return the new content as a one-item list."""
        return [self.text]

    def _read(self, lr):
        """Read and decode a "literal" binary hunk from lr.

        Every line read is also appended to self.hunk. Raise PatchError
        if no "literal" line is found or if the decoded size differs
        from the announced one.
        """
        line = lr.readline()
        self.hunk.append(line)
        while line and not line.startswith('literal '):
            line = lr.readline()
            self.hunk.append(line)
        if not line:
            raise PatchError(_('could not extract binary patch'))
        # "literal <size>"
        size = int(line[8:].rstrip())
        dec = []
        line = lr.readline()
        self.hunk.append(line)
        # data lines run until an empty (or newline only) line
        while len(line) > 1:
            # the first character encodes the number of decoded bytes:
            # 'A'-'Z' for 1-26, 'a'-'z' for 27-52
            l = line[0]
            if l <= 'Z' and l >= 'A':
                l = ord(l) - ord('A') + 1
            else:
                l = ord(l) - ord('a') + 27
            dec.append(base85.b85decode(line[1:-1])[:l])
            line = lr.readline()
            self.hunk.append(line)
        text = zlib.decompress(''.join(dec))
        if len(text) != size:
            # both values must be given to '%' as one tuple, otherwise
            # the formatting itself fails with a TypeError
            raise PatchError(_('binary patch is %d bytes, not %d') %
                             (len(text), size))
        self.text = text
1007 1007
def parsefilename(str):
    """Extract the file name from a '--- name' / '+++ name' header line.

    The first four characters are dropped along with any trailing CR/LF.
    The name ends at the first tab if there is one, otherwise at the
    first space, otherwise it is the whole remainder.
    """
    # --- filename \t|space stuff
    name = str[4:].rstrip('\r\n')
    for sep in ('\t', ' '):
        cut = name.find(sep)
        if cut >= 0:
            return name[:cut]
    return name
1017 1017
def pathstrip(path, strip):
    """Split path after its first 'strip' directory components.

    Returns a (stripped prefix, remaining path) pair.  The prefix has
    leading whitespace removed and the remainder trailing whitespace
    removed.  With strip == 0 the prefix is empty.  Raises PatchError
    when path has fewer than 'strip' slash-terminated components.
    """
    if strip == 0:
        return '', path.rstrip()
    last = len(path) - 1
    pos = 0
    for remaining in range(strip, 0, -1):
        pos = path.find('/', pos)
        if pos == -1:
            raise PatchError(_("unable to strip away %d of %d dirs from %s") %
                             (remaining, strip, path))
        pos += 1
        # consume '//' in the path
        while pos < last and path[pos] == '/':
            pos += 1
    return path[:pos].lstrip(), path[pos:].rstrip()
1035 1035
def selectfile(backend, afile_orig, bfile_orig, hunk, strip):
    """Choose which file a hunk should be applied to.

    afile_orig and bfile_orig are the source and destination names from
    the patch headers; 'strip' leading components are removed from each
    with pathstrip().  Returns (fname, missing) where 'missing' is True
    when neither candidate exists in the backend and the hunk does not
    create the file.  Raises PatchError when both names are /dev/null
    and no name could be selected.
    """
    nulla = afile_orig == "/dev/null"
    nullb = bfile_orig == "/dev/null"

    abase, afile = pathstrip(afile_orig, strip)
    gooda = not nulla and backend.exists(afile)
    bbase, bfile = pathstrip(bfile_orig, strip)
    goodb = gooda
    if afile != bfile:
        goodb = not nullb and backend.exists(bfile)
    iscreate = hunk.createfile
    missing = not (goodb or gooda or iscreate())

    # some diff programs apparently produce patches where the afile is
    # not /dev/null, but afile starts with bfile
    adir = afile[:afile.rfind('/') + 1]
    bdir = bfile[:bfile.rfind('/') + 1]
    if missing and adir == bdir and afile.startswith(bfile):
        # this isn't very pretty
        hunk.create = True
        if iscreate():
            missing = False
        else:
            hunk.create = False

    # If afile is "a/b/foo" and bfile is "a/b/foo.orig" we assume the
    # diff is between a file and its backup. In this case, the original
    # file should be patched (see original mpatch code).
    isbackup = (abase == bbase and bfile.startswith(afile))
    preferred = isbackup and afile or bfile

    fname = None
    if not missing:
        if gooda and goodb:
            fname = preferred
        elif gooda:
            fname = afile

    if not fname:
        if not nullb:
            fname = preferred
        elif not nulla:
            fname = afile
        else:
            raise PatchError(_("undefined source and destination files"))

    return fname, missing
1081 1081
def scangitpatch(lr, firstline):
    """
    Git patches can emit:
    - rename a to b
    - change b
    - copy a to c
    - change c

    We cannot apply this sequence as-is, the renamed 'a' could not be
    found for it would have been renamed already. And we cannot copy
    from 'b' instead because 'b' would have been changed already. So
    we scan the git patch for copy and rename commands so we can
    perform the copies ahead of time.

    The underlying file is read through a temporary line reader primed
    with 'firstline', then seeked back to where it was.  If the file
    cannot report its position (IOError from tell()), its remaining
    content is read into an in-memory buffer and that buffer is scanned
    and rewound to 0 instead.
    """
    source = lr.fp
    try:
        start = source.tell()
        fp = source
    except IOError:
        start = 0
        fp = cStringIO.StringIO(source.read())
    scanner = linereader(fp, lr.textmode)
    scanner.push(firstline)
    found = readgitpatch(scanner)
    fp.seek(start)
    return found
1107 1107
def iterhunks(fp):
    """Read a patch and yield the following events:
    - ("file", (afile, bfile, firsthunk, gp)): select a new target file.
    firsthunk is None for git entries carrying no hunk, gp is the
    matching gitpatch record or None when there is none.
    - ("hunk", hunk): a new hunk is ready to be applied, follows a
    "file" event.
    - ("git", gitchanges): current diff is in git format, gitchanges
    is the list of gitpatch records describing copies and renames.
    Unique event.

    Raises PatchError when a "diff --git" header cannot be matched with
    any of the remaining git metadata records.
    """
    afile = ""
    bfile = ""
    state = None
    hunknum = 0
    emitfile = newfile = False
    # list of ('b/' + path, gitpatch) pairs, reversed so that the next
    # expected entry is at the end; None until a git header is seen
    gitpatches = None

    # our states
    BFILE = 1
    # None: diff flavor unknown, True: context diff, False: unified diff
    context = None
    lr = linereader(fp)

    while True:
        x = lr.readline()
        if not x:
            break
        if state == BFILE and (
            (not context and x[0] == '@')
            or (context is not False and x.startswith('***************'))
            or x.startswith('GIT binary patch')):
            gp = None
            if gitpatches and gitpatches[-1][0] == bfile:
                gp = gitpatches.pop()[1]
            if x.startswith('GIT binary patch'):
                h = binhunk(gp, lr)
            else:
                if context is None and x.startswith('***************'):
                    context = True
                create = afile == '/dev/null' or gp and gp.op == 'ADD'
                remove = bfile == '/dev/null' or gp and gp.op == 'DELETE'
                h = hunk(x, hunknum + 1, lr, context, create, remove)
            hunknum += 1
            if emitfile:
                emitfile = False
                yield 'file', (afile, bfile, h, gp)
            yield 'hunk', h
        elif x.startswith('diff --git'):
            m = gitre.match(x)
            if not m:
                continue
            if gitpatches is None:
                # scan whole input for git metadata
                gitpatches = [('b/' + gp.path, gp) for gp
                              in scangitpatch(lr, x)]
                yield 'git', [g[1] for g in gitpatches
                              if g[1].op in ('COPY', 'RENAME')]
                gitpatches.reverse()
            afile = 'a/' + m.group(1)
            bfile = 'b/' + m.group(2)
            # emit hunk-less entries preceding the current file; stop
            # when the list runs dry instead of indexing an empty list
            while gitpatches and bfile != gitpatches[-1][0]:
                gp = gitpatches.pop()[1]
                yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp)
            if not gitpatches:
                raise PatchError(_('failed to synchronize metadata for "%s"')
                                 % bfile[2:])
            gp = gitpatches[-1][1]
            # copy/rename + modify should modify target, not source
            if gp.op in ('COPY', 'DELETE', 'RENAME', 'ADD') or gp.mode:
                afile = bfile
            newfile = True
        elif x.startswith('---'):
            # check for a unified diff
            l2 = lr.readline()
            if not l2.startswith('+++'):
                lr.push(l2)
                continue
            newfile = True
            context = False
            afile = parsefilename(x)
            bfile = parsefilename(l2)
        elif x.startswith('***'):
            # check for a context diff
            l2 = lr.readline()
            if not l2.startswith('---'):
                lr.push(l2)
                continue
            l3 = lr.readline()
            lr.push(l3)
            if not l3.startswith("***************"):
                lr.push(l2)
                continue
            newfile = True
            context = True
            afile = parsefilename(x)
            bfile = parsefilename(l2)

        if newfile:
            newfile = False
            emitfile = True
            state = BFILE
            hunknum = 0

    # remaining git entries had no hunk at all
    while gitpatches:
        gp = gitpatches.pop()[1]
        yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp)
1207 1208
def applydiff(ui, fp, changed, backend, strip=1, eolmode='strict'):
    """Read a patch from fp and try to apply it through backend.

    Every file name touched by the patch is recorded in the 'changed'
    dict. The result is 0 when the patch applied cleanly, 1 when it
    applied with fuzz and -1 when at least one reject was produced.

    With 'eolmode' set to 'strict', patch content and patched files are
    read in binary mode. Any other value makes line endings ignored
    while patching, then normalized according to 'eolmode'.
    """
    return _applydiff(ui, fp, patchfile, backend, changed,
                      strip=strip, eolmode=eolmode)
1221 1222
1222 1223 def _applydiff(ui, fp, patcher, backend, changed, strip=1, eolmode='strict'):
1224
1225 def pstrip(p):
1226 return pathstrip(p, strip - 1)[1]
1227
1223 1228 rejects = 0
1224 1229 err = 0
1225 1230 current_file = None
1226 1231
1227 1232 for state, values in iterhunks(fp):
1228 1233 if state == 'hunk':
1229 1234 if not current_file:
1230 1235 continue
1231 1236 ret = current_file.apply(values)
1232 1237 if ret >= 0:
1233 1238 changed.setdefault(current_file.fname, None)
1234 1239 if ret > 0:
1235 1240 err = 1
1236 1241 elif state == 'file':
1237 1242 if current_file:
1238 1243 rejects += current_file.close()
1239 1244 current_file = None
1240 1245 afile, bfile, first_hunk, gp = values
1241 1246 if gp:
1242 changed[gp.path] = gp
1247 path = pstrip(gp.path)
1248 changed[path] = gp
1243 1249 if gp.op == 'DELETE':
1244 backend.unlink(gp.path)
1250 backend.unlink(path)
1245 1251 continue
1246 1252 if gp.op == 'RENAME':
1247 backend.unlink(gp.oldpath)
1253 backend.unlink(pstrip(gp.oldpath))
1248 1254 if gp.mode and not first_hunk:
1249 1255 if gp.op == 'ADD':
1250 1256 # Added files without content have no hunk and must be created
1251 backend.writelines(gp.path, [], gp.mode)
1257 backend.writelines(path, [], gp.mode)
1252 1258 else:
1253 backend.setmode(gp.path, gp.mode[0], gp.mode[1])
1259 backend.setmode(path, gp.mode[0], gp.mode[1])
1254 1260 if not first_hunk:
1255 1261 continue
1256 1262 try:
1257 1263 mode = gp and gp.mode or None
1258 1264 current_file, missing = selectfile(backend, afile, bfile,
1259 1265 first_hunk, strip)
1260 1266 current_file = patcher(ui, current_file, backend, mode,
1261 1267 missing=missing, eolmode=eolmode)
1262 1268 except PatchError, inst:
1263 1269 ui.warn(str(inst) + '\n')
1264 1270 current_file = None
1265 1271 rejects += 1
1266 1272 continue
1267 1273 elif state == 'git':
1268 1274 for gp in values:
1269 gp.path = pathstrip(gp.path, strip - 1)[1]
1270 if gp.oldpath:
1271 gp.oldpath = pathstrip(gp.oldpath, strip - 1)[1]
1272 if gp.op in ('COPY', 'RENAME'):
1273 backend.copy(gp.oldpath, gp.path)
1275 backend.copy(pstrip(gp.oldpath), pstrip(gp.path))
1274 1276 else:
1275 1277 raise util.Abort(_('unsupported parser state: %s') % state)
1276 1278
1277 1279 if current_file:
1278 1280 rejects += current_file.close()
1279 1281
1280 1282 if rejects:
1281 1283 return -1
1282 1284 return err
1283 1285
def _externalpatch(ui, repo, patcher, patchname, strip, files,
                   similarity):
    """use <patcher> to apply <patchname> to the working directory.
    returns whether patch was applied with fuzz factor.

    The names reported by the external program in its "patching file"
    lines are recorded as keys of 'files'. When 'files' is not empty,
    scmutil.addremove() is run on them even if reading the output
    failed. Raises PatchError when the program exits with a non-zero
    status."""

    fuzz = False
    args = []
    cwd = repo.root
    if cwd:
        args.append('-d %s' % util.shellquote(cwd))
    fp = util.popen('%s %s -p%d < %s' % (patcher, ' '.join(args), strip,
                                       util.shellquote(patchname)))
    # No "patching file" line has been seen yet: there is no file name
    # to print, so start as if it had already been printed. This keeps
    # a fuzz/FAILED line arriving first from hitting unbound locals.
    pf = None
    printed_file = True
    try:
        for line in fp:
            line = line.rstrip()
            ui.note(line + '\n')
            if line.startswith('patching file '):
                pf = util.parsepatchoutput(line)
                printed_file = False
                files.setdefault(pf, None)
            elif line.find('with fuzz') >= 0:
                fuzz = True
                if not printed_file:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
            elif line.find('saving rejects to file') >= 0:
                ui.warn(line + '\n')
            elif line.find('FAILED') >= 0:
                if not printed_file:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
    finally:
        if files:
            cfiles = list(files)
            cwd = repo.getcwd()
            if cwd:
                # iterate over the list built above ('cfiles')
                cfiles = [util.pathto(repo.root, cwd, f)
                          for f in cfiles]
            scmutil.addremove(repo, cfiles, similarity=similarity)
    code = fp.close()
    if code:
        raise PatchError(_("patch command failed: %s") %
                         util.explainexit(code)[0])
    return fuzz
1330 1332
def internalpatch(ui, repo, patchobj, strip, files=None, eolmode='strict',
                  similarity=0):
    """use builtin patch to apply <patchobj> to the working directory.
    returns whether patch was applied with fuzz factor.

    patchobj is first passed to open(); if that raises TypeError it is
    used directly as the patch file object and is not closed here.
    Raises util.Abort for an unknown eolmode and PatchError when the
    patch does not apply."""

    if files is None:
        files = {}
    if eolmode is None:
        eolmode = ui.config('patch', 'eol', 'strict')
    normalized = eolmode.lower()
    if normalized not in eolmodes:
        raise util.Abort(_('unsupported line endings type: %s') % eolmode)
    eolmode = normalized

    backend = workingbackend(ui, repo, similarity)
    try:
        fp = open(patchobj, 'rb')
    except TypeError:
        fp = patchobj
    try:
        ret = applydiff(ui, fp, files, backend, strip=strip, eolmode=eolmode)
    finally:
        # only close what was opened here
        if fp != patchobj:
            fp.close()
        files.update(dict.fromkeys(backend.close()))
    if ret < 0:
        raise PatchError(_('patch failed to apply'))
    return ret > 0
1358 1360
1359 1361 def patch(ui, repo, patchname, strip=1, files=None, eolmode='strict',
1360 1362 similarity=0):
1361 1363 """Apply <patchname> to the working directory.
1362 1364
1363 1365 'eolmode' specifies how end of lines should be handled. It can be:
1364 1366 - 'strict': inputs are read in binary mode, EOLs are preserved
1365 1367 - 'crlf': EOLs are ignored when patching and reset to CRLF
1366 1368 - 'lf': EOLs are ignored when patching and reset to LF
1367 1369 - None: get it from user settings, default to 'strict'
1368 1370 'eolmode' is ignored when using an external patcher program.
1369 1371
1370 1372 Returns whether patch was applied with fuzz factor.
1371 1373 """
1372 1374 patcher = ui.config('ui', 'patch')
1373 1375 if files is None:
1374 1376 files = {}
1375 1377 try:
1376 1378 if patcher:
1377 1379 return _externalpatch(ui, repo, patcher, patchname, strip,
1378 1380 files, similarity)
1379 1381 return internalpatch(ui, repo, patchname, strip, files, eolmode,
1380 1382 similarity)
1381 1383 except PatchError, err:
1382 1384 raise util.Abort(str(err))
1383 1385
def changedfiles(ui, repo, patchpath, strip=1):
    """Return the set of file names touched by the patch at patchpath.

    Nothing is applied: the patch is parsed with iterhunks() and only
    "file" events are looked at. Git metadata paths are stripped with
    strip - 1 components; for renames the old path is included too.
    """
    def pstrip(p):
        return pathstrip(p, strip - 1)[1]

    backend = fsbackend(ui, repo.root)
    fp = open(patchpath, 'rb')
    try:
        touched = set()
        for state, values in iterhunks(fp):
            if state in ('hunk', 'git'):
                continue
            if state != 'file':
                raise util.Abort(_('unsupported parser state: %s') % state)
            afile, bfile, first_hunk, gp = values
            if gp:
                touched.add(pstrip(gp.path))
                if gp.op == 'RENAME':
                    touched.add(pstrip(gp.oldpath))
            if not first_hunk:
                continue
            fname, missing = selectfile(backend, afile, bfile,
                                        first_hunk, strip)
            touched.add(fname)
        return touched
    finally:
        fp.close()
1413 1408
def b85diff(to, tn):
    '''return a base85-encoded git binary "literal" patch for tn

    'to' and 'tn' are the old and new contents. The empty string is
    returned when both hash to the same git blob id.'''
    def gitindex(text):
        # git blob id of text; the null id stands for empty content
        if not text:
            return hex(nullid)
        digest = util.sha1('blob %d\0' % len(text))
        digest.update(text)
        return digest.hexdigest()

    def fmtline(line):
        # length prefix: 'A'..'Z' for 1..26 bytes, 'a'.. for 27 and up
        size = len(line)
        if size <= 26:
            base = ord('A') - 1
        else:
            base = ord('a') - 27
        return '%c%s\n' % (chr(base + size), base85.b85encode(line, True))

    def chunk(text, csize=52):
        for start in range(0, len(text), csize):
            yield text[start:start + csize]

    tohash = gitindex(to)
    tnhash = gitindex(tn)
    if tohash == tnhash:
        return ""

    # TODO: deltas
    pieces = ['index %s..%s\nGIT binary patch\nliteral %s\n' %
              (tohash, tnhash, len(tn))]
    pieces.extend([fmtline(part) for part in chunk(zlib.compress(tn))])
    pieces.append('\n')
    return ''.join(pieces)
1451 1446
class GitDiffRequired(Exception):
    """Raised by diff() when a change needs the git patch format."""
1454 1449
def diffopts(ui, opts=None, untrusted=False):
    """Build an mdiff.diffopts from command options and the [diff] config.

    For each setting, a true value in 'opts' wins; otherwise the value
    is read from the 'diff' configuration section. 'text' is taken from
    'opts' only.
    """
    def lookup(key, name=None, getter=ui.configbool):
        value = opts and opts.get(key)
        if value:
            return value
        return getter('diff', name or key, None, untrusted=untrusted)

    text = opts and opts.get('text')
    git = lookup('git')
    nodates = lookup('nodates')
    showfunc = lookup('show_function', 'showfunc')
    ignorews = lookup('ignore_all_space', 'ignorews')
    ignorewsamount = lookup('ignore_space_change', 'ignorewsamount')
    ignoreblanklines = lookup('ignore_blank_lines', 'ignoreblanklines')
    context = lookup('unified', getter=ui.config)
    return mdiff.diffopts(
        text=text,
        git=git,
        nodates=nodates,
        showfunc=showfunc,
        ignorews=ignorews,
        ignorewsamount=ignorewsamount,
        ignoreblanklines=ignoreblanklines,
        context=context)
1468 1463
def diff(repo, node1=None, node2=None, match=None, changes=None, opts=None,
         losedatafn=None, prefix=''):
    '''yields diff of changes to files between two nodes, or node and
    working directory.

    if node1 is None, use first dirstate parent instead.
    if node2 is None, compare node1 with working directory.

    losedatafn(**kwarg) is a callable run when opts.upgrade=True and
    every time some change cannot be represented with the current
    patch format. Return False to upgrade to git patch format, True to
    accept the loss or raise an exception to abort the diff. It is
    called with the name of current file being diffed as 'fn'. If set
    to None, patches will always be upgraded to git format when
    necessary.

    prefix is a filename prefix that is prepended to all filenames on
    display (used for subrepos).
    '''

    if opts is None:
        opts = mdiff.defaultopts

    if not node1 and not node2:
        node1 = repo.dirstate.p1()

    def lrugetfilectx():
        # filelog cache keyed by file name; 'recent' lists the names from
        # least to most recently used
        filelogs = {}
        recent = []
        def getfilectx(f, ctx):
            fctx = ctx.filectx(f, filelog=filelogs.get(f))
            if f in filelogs:
                recent.remove(f)
            else:
                if len(filelogs) > 20:
                    del filelogs[recent.pop(0)]
                filelogs[f] = fctx.filelog()
            recent.append(f)
            return fctx
        return getfilectx
    getfilectx = lrugetfilectx()

    ctx1 = repo[node1]
    ctx2 = repo[node2]

    if not changes:
        changes = repo.status(ctx1, ctx2, match=match)
    modified, added, removed = changes[:3]

    if not (modified or added or removed):
        return []

    revs = None
    if not repo.ui.quiet:
        hexfunc = repo.ui.debugflag and hex or short
        revs = [hexfunc(node) for node in [node1, node2] if node]

    copy = {}
    if opts.git or opts.upgrade:
        copy = copies.copies(repo, ctx1, ctx2, repo[nullid])[0]

    def difffn(opts, losedata):
        return trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
                       copy, getfilectx, opts, losedata, prefix)

    if not opts.upgrade or opts.git:
        return difffn(opts, None)

    def losedata(fn):
        if not losedatafn or not losedatafn(fn=fn):
            raise GitDiffRequired()
    try:
        # Buffer the whole output until we are sure it can be generated
        return list(difffn(opts.copy(git=False), losedata))
    except GitDiffRequired:
        return difffn(opts.copy(git=True), None)
1543 1538
def difflabel(func, *args, **kw):
    '''yields 2-tuples of (output, label) based on the output of func()

    Each chunk produced by func(*args, **kw) is split into lines. A
    line is labelled after the first prefix it starts with, newlines
    are yielded separately with an empty label, and trailing whitespace
    on lines starting with "+" or "-" gets its own label.'''
    prefixes = [('diff', 'diff.diffline'),
                ('copy', 'diff.extended'),
                ('rename', 'diff.extended'),
                ('old', 'diff.extended'),
                ('new', 'diff.extended'),
                ('deleted', 'diff.extended'),
                ('---', 'diff.file_a'),
                ('+++', 'diff.file_b'),
                ('@@', 'diff.hunk'),
                ('-', 'diff.deleted'),
                ('+', 'diff.inserted')]

    def labelfor(text):
        # first matching prefix wins, None when nothing matches
        for prefix, label in prefixes:
            if text.startswith(prefix):
                return label
        return None

    for chunk in func(*args, **kw):
        for index, line in enumerate(chunk.split('\n')):
            if index:
                yield ('\n', '')
            body = line
            if line and line[0] in '+-':
                # highlight trailing whitespace, but only in changed lines
                body = line.rstrip()
            label = labelfor(body)
            if label is None:
                yield (line, '')
            else:
                yield (body, label)
            if line != body:
                yield (line[len(body):], 'diff.trailingwhitespace')
1575 1570
def diffui(*args, **kw):
    '''same as diff(), except that the output is passed through
    difflabel() and so comes out as (output, label) 2-tuples suitable
    for ui.write()'''
    labelled = difflabel(diff, *args, **kw)
    return labelled
1579 1574
1580 1575
1581 1576 def _addmodehdr(header, omode, nmode):
1582 1577 if omode != nmode:
1583 1578 header.append('old mode %s\n' % omode)
1584 1579 header.append('new mode %s\n' % nmode)
1585 1580
def trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
            copy, getfilectx, opts, losedatafn, prefix):
    """Generate the diff between ctx1 and ctx2 as a sequence of strings.

    Files from 'modified', 'added' and 'removed' are processed in sorted
    order. For each of them, a header string (when there is one worth
    emitting) and then the diff text (when not empty) are yielded.

    'copy' maps copy destinations to their sources. 'getfilectx(f, ctx)'
    returns the file context used to read file data. 'prefix' is joined
    in front of every displayed file name. When 'losedatafn' is set, it
    is called with the file name each time a change cannot be expressed
    without the git format and opts.git is not set.
    """

    def join(f):
        return os.path.join(prefix, f)

    date1 = util.datestr(ctx1.date())
    man1 = ctx1.manifest()

    # copy sources already reported as the origin of a rename
    gone = set()
    # manifest flag -> git file mode
    gitmode = {'l': '120000', 'x': '100755', '': '100644'}

    # reverse of 'copy': source -> destination
    copyto = dict([(v, k) for k, v in copy.items()])

    if opts.git:
        revs = None

    for f in sorted(modified + added + removed):
        # old and new contents, None when absent on that side
        to = None
        tn = None
        # True: text diff, 'binary': base85 diff, False: no diff body
        dodiff = True
        header = []
        if f in man1:
            to = getfilectx(f, ctx1).data()
        if f not in removed:
            tn = getfilectx(f, ctx2).data()
        # names shown on the old and new sides
        a, b = f, f
        if opts.git or losedatafn:
            if f in added:
                mode = gitmode[ctx2.flags(f)]
                if f in copy or f in copyto:
                    if opts.git:
                        if f in copy:
                            a = copy[f]
                        else:
                            a = copyto[f]
                        omode = gitmode[man1.flags(a)]
                        _addmodehdr(header, omode, mode)
                        # the first destination of a removed source is
                        # reported as a rename, later ones as copies
                        if a in removed and a not in gone:
                            op = 'rename'
                            gone.add(a)
                        else:
                            op = 'copy'
                        header.append('%s from %s\n' % (op, join(a)))
                        header.append('%s to %s\n' % (op, join(f)))
                        # diff against the copy source content
                        to = getfilectx(a, ctx1).data()
                    else:
                        losedatafn(f)
                else:
                    if opts.git:
                        header.append('new file mode %s\n' % mode)
                    elif ctx2.flags(f):
                        losedatafn(f)
                # In theory, if tn was copied or renamed we should check
                # if the source is binary too but the copy record already
                # forces git mode.
                if util.binary(tn):
                    if opts.git:
                        dodiff = 'binary'
                    else:
                        losedatafn(f)
                if not opts.git and not tn:
                    # regular diffs cannot represent new empty file
                    losedatafn(f)
            elif f in removed:
                if opts.git:
                    # have we already reported a copy above?
                    if ((f in copy and copy[f] in added
                         and copyto[copy[f]] == f) or
                        (f in copyto and copyto[f] in added
                         and copy[copyto[f]] == f)):
                        dodiff = False
                    else:
                        header.append('deleted file mode %s\n' %
                                      gitmode[man1.flags(f)])
                elif not to or util.binary(to):
                    # regular diffs cannot represent empty file deletion
                    losedatafn(f)
            else:
                # file present on both sides
                oflag = man1.flags(f)
                nflag = ctx2.flags(f)
                binary = util.binary(to) or util.binary(tn)
                if opts.git:
                    _addmodehdr(header, gitmode[oflag], gitmode[nflag])
                    if binary:
                        dodiff = 'binary'
                elif binary or nflag != oflag:
                    losedatafn(f)
            if opts.git:
                # the diff line always comes first in the header
                header.insert(0, mdiff.diffline(revs, join(a), join(b), opts))

        if dodiff:
            if dodiff == 'binary':
                text = b85diff(to, tn)
            else:
                text = mdiff.unidiff(to, date1,
                                    # ctx2 date may be dynamic
                                    tn, util.datestr(ctx2.date()),
                                    join(a), join(b), revs, opts=opts)
            # a header holding a single line is only emitted along with
            # some diff text
            if header and (text or len(header) > 1):
                yield ''.join(header)
            if text:
                yield text
1689 1684
def diffstatdata(lines):
    """Yield (filename, adds, removes, isbinary) for each file in a diff.

    A new file starts at every line beginning with 'diff'. Lines
    starting with a single '+' or '-' (but not '+++' or '---') are
    counted as additions and removals. 'isbinary' is True when both
    counts are zero.
    """
    diffre = re.compile('^diff .*-r [a-z0-9]+\s(.*)$')

    name = None
    added = removed = 0
    for text in lines:
        if text.startswith('diff'):
            if name:
                yield (name, added, removed, added == 0 and removed == 0)
            # set numbers to 0 anyway when starting new file
            added = removed = 0
            if text.startswith('diff --git'):
                name = gitre.search(text).group(1)
            elif text.startswith('diff -r'):
                # format: "diff -r ... -r ... filename"
                name = diffre.search(text).group(1)
        elif text.startswith('+') and not text.startswith('+++'):
            added += 1
        elif text.startswith('-') and not text.startswith('---'):
            removed += 1
    if name:
        yield (name, added, removed, added == 0 and removed == 0)
1713 1708
def diffstat(lines, width=80, git=False):
    """Return a diffstat summary of the diff in 'lines' as one string.

    There is one row per file followed, when at least one file was
    found, by a totals line. 'width' bounds the size of the +/- graph,
    which is never narrower than 10 columns. With 'git' set, files
    flagged as binary show 'Bin' instead of a count.
    """
    stats = list(diffstatdata(lines))
    sized = [(filename, adds, removes, isbinary, encoding.colwidth(filename))
             for filename, adds, removes, isbinary in stats]

    totaladds = sum([entry[1] for entry in sized])
    totalremoves = sum([entry[2] for entry in sized])
    maxname = max([0] + [entry[4] for entry in sized])
    maxtotal = max([0] + [entry[1] + entry[2] for entry in sized])
    hasbinary = bool([entry for entry in sized if entry[3]])

    countwidth = len(str(maxtotal))
    if hasbinary:
        # leave room for 'Bin'
        countwidth = max(countwidth, 3)
    graphwidth = max(width - countwidth - maxname - 6, 10)

    def scale(i):
        if maxtotal <= graphwidth:
            return i
        # If diffstat runs out of room it doesn't print anything,
        # which isn't very useful, so always print at least one + or -
        # if there were at least some changes.
        return max(i * graphwidth // maxtotal, int(bool(i)))

    output = []
    for filename, adds, removes, isbinary, namewidth in sized:
        count = adds + removes
        if git and isbinary:
            count = 'Bin'
        padding = ' ' * (maxname - namewidth)
        output.append(' %s%s | %*s %s%s\n' %
                      (filename, padding,
                       countwidth, count,
                       '+' * scale(adds), '-' * scale(removes)))

    if stats:
        output.append(_(' %d files changed, %d insertions(+), %d deletions(-)\n')
                      % (len(stats), totaladds, totalremoves))

    return ''.join(output)
1765 1760
def diffstatui(*args, **kw):
    '''same as diffstat(), except that the output comes as (output,
    label) 2-tuples for ui.write(), with the "+" and "-" runs of each
    graph labelled separately
    '''
    graphparts = [(r'\++', 'diffstat.inserted'),
                  (r'-+', 'diffstat.deleted')]

    for line in diffstat(*args, **kw).splitlines():
        if not line or line[-1] not in '+-':
            # no graph on this line, pass it through unlabelled
            yield (line, '')
        else:
            name, graph = line.rsplit(' ', 1)
            yield (name + ' ', '')
            for pattern, label in graphparts:
                m = re.search(pattern, graph)
                if m:
                    yield (m.group(0), label)
        yield ('\n', '')
General Comments 0
You need to be logged in to leave comments. Login now