##// END OF EJS Templates
patch: refactor iterhunks() regular and binary files emission
Patrick Mezard -
r14383:1bd52cb1 default
parent child Browse files
Show More
@@ -1,1780 +1,1778 b''
1 1 # patch.py - patch file parsing routines
2 2 #
3 3 # Copyright 2006 Brendan Cully <brendan@kublai.com>
4 4 # Copyright 2007 Chris Mason <chris.mason@oracle.com>
5 5 #
6 6 # This software may be used and distributed according to the terms of the
7 7 # GNU General Public License version 2 or any later version.
8 8
9 9 import cStringIO, email.Parser, os, errno, re
10 10 import tempfile, zlib
11 11
12 12 from i18n import _
13 13 from node import hex, nullid, short
14 14 import base85, mdiff, scmutil, util, diffhelpers, copies, encoding
15 15
# Matches a git extended diff header line; group 1 captures the path
# after "a/" and group 2 the path after "b/".
gitre = re.compile('diff --git a/(.*) b/(.*)')
17 17
class PatchError(Exception):
    """Error raised by this module when patch data cannot be parsed or
    applied (bad hunks, undecodable binary patches, unstrippable paths).
    """
20 20
21 21
22 22 # public functions
23 23
def split(stream):
    '''Return an iterator of individual patches found in a stream.

    The leading lines of the stream are inspected to pick a splitting
    strategy: "hg export" output, mbox, MIME message, patches introduced
    by RFC-822 style headers, or a single plain patch. Every item
    produced is a cStringIO.StringIO object holding one patch.
    '''
    def isheader(line, inheader):
        # True when the line looks like "Name: value" or, while already
        # inside a header block, like a folded continuation line.
        first = line[0]
        if inheader and first in (' ', '\t'):
            # continuation
            return True
        if first in (' ', '-', '+'):
            # diff line - don't check for header pattern in there
            return False
        fields = line.split(': ', 1)
        return len(fields) == 2 and ' ' not in fields[0]

    def chunk(lines):
        # Wrap accumulated lines into a file-like object.
        return cStringIO.StringIO(''.join(lines))

    def hgsplit(stream, cur):
        # Split on "# HG changeset patch" markers seen outside a header.
        inheader = True
        pending = cur

        for line in stream:
            if not line.strip():
                inheader = False
            if not inheader and line.startswith('# HG changeset patch'):
                yield chunk(pending)
                pending = []
                inheader = True

            pending.append(line)

        if pending:
            yield chunk(pending)

    def mboxsplit(stream, cur):
        # Split on mbox "From " separators; the separator line itself
        # (first accumulated line) is dropped before recursing.
        pending = cur
        for line in stream:
            if line.startswith('From '):
                for patch in split(chunk(pending[1:])):
                    yield patch
                pending = []

            pending.append(line)

        if pending:
            for patch in split(chunk(pending[1:])):
                yield patch

    def mimesplit(stream, cur):
        # Let the email parser decode the message and yield each
        # acceptable text part.
        def msgfp(m):
            out = cStringIO.StringIO()
            gen = email.Generator.Generator(out, mangle_from_=False)
            gen.flatten(m)
            out.seek(0)
            return out

        cur.extend(stream)
        msg = email.Parser.Parser().parse(chunk(cur))
        if msg.is_multipart():
            ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
            for part in msg.walk():
                if part.get_content_type() in ok_types:
                    yield msgfp(part)
        else:
            yield msgfp(msg)

    def headersplit(stream, cur):
        # Start a new patch every time a header block begins.
        inheader = False
        pending = cur

        for line in stream:
            if not inheader and isheader(line, inheader):
                yield chunk(pending)
                pending = []
                inheader = True
            if inheader and not isheader(line, inheader):
                inheader = False

            pending.append(line)

        if pending:
            yield chunk(pending)

    def remainder(cur):
        # Whole input is one patch.
        yield chunk(cur)

    def fiter(fp):
        # Iterate over an object that only offers readline().
        while True:
            text = fp.readline()
            if not text:
                return
            yield text

    seenheader = False
    lines = []
    mimeheaders = ['content-type']

    if not hasattr(stream, 'next'):
        # http responses, for example, have readline but not next
        stream = fiter(stream)

    for line in stream:
        lines.append(line)
        if line.startswith('# HG changeset patch'):
            return hgsplit(stream, lines)
        if line.startswith('From '):
            return mboxsplit(stream, lines)
        if isheader(line, seenheader):
            seenheader = True
            if line.split(':', 1)[0].lower() in mimeheaders:
                # let email parser handle this
                return mimesplit(stream, lines)
        elif line.startswith('--- ') and seenheader:
            # No evil headers seen by diff start, split by hand
            return headersplit(stream, lines)
        # Not enough info, keep reading

    # if we are here, we have a very plain patch
    return remainder(lines)
150 150
def extract(ui, fileobj):
    '''extract patch from data read from fileobj.

    patch can be a normal patch or contained in an email message.

    The input is parsed with the email parser. Text parts are scanned
    for the start of a diff; the text preceding the diff becomes the
    commit message (with "# HG changeset patch" header fields pulled out
    into user, date, branch, node and parents) and the full payload of
    each part containing a diff is written to a temporary file.

    return tuple (filename, message, user, date, branch, node, p1, p2).
    Any item in the returned tuple can be None. If filename is None,
    fileobj did not contain a patch. Caller must unlink filename when done.'''

    # attempt to detect the start of a patch
    # (this heuristic is borrowed from quilt)
    diffre = re.compile(r'^(?:Index:[ \t]|diff[ \t]|RCS file: |'
                        r'retrieving revision [0-9]+(\.[0-9]+)*$|'
                        r'---[ \t].*?^\+\+\+[ \t]|'
                        r'\*\*\*[ \t].*?^---[ \t])', re.MULTILINE|re.DOTALL)

    fd, tmpname = tempfile.mkstemp(prefix='hg-patch-')
    tmpfp = os.fdopen(fd, 'w')
    try:
        msg = email.Parser.Parser().parse(fileobj)

        subject = msg['Subject']
        user = msg['From']
        if not subject and not user:
            # Not an email, restore parsed headers if any
            subject = '\n'.join(': '.join(h) for h in msg.items()) + '\n'

        gitsendmail = 'git-send-email' in msg.get('X-Mailer', '')
        # should try to parse msg['Date']
        date = None
        nodeid = None
        branch = None
        parents = []

        if subject:
            # strip a leading "[PATCH ...]" tag and unfold the subject
            if subject.startswith('[PATCH'):
                pend = subject.find(']')
                if pend >= 0:
                    subject = subject[pend + 1:].lstrip()
            subject = subject.replace('\n\t', ' ')
            ui.debug('Subject: %s\n' % subject)
        if user:
            ui.debug('From: %s\n' % user)
        diffs_seen = 0
        ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
        message = ''
        for part in msg.walk():
            content_type = part.get_content_type()
            ui.debug('Content-Type: %s\n' % content_type)
            if content_type not in ok_types:
                continue
            payload = part.get_payload(decode=True)
            m = diffre.search(payload)
            if m:
                hgpatch = False
                hgpatchheader = False
                ignoretext = False

                ui.debug('found patch at byte %d\n' % m.start(0))
                diffs_seen += 1
                cfp = cStringIO.StringIO()
                # everything before the diff is message and/or hg header
                for line in payload[:m.start(0)].splitlines():
                    if line.startswith('# HG changeset patch') and not hgpatch:
                        ui.debug('patch generated by hg export\n')
                        hgpatch = True
                        hgpatchheader = True
                        # drop earlier commit message content
                        cfp.seek(0)
                        cfp.truncate()
                        subject = None
                    elif hgpatchheader:
                        if line.startswith('# User '):
                            user = line[7:]
                            ui.debug('From: %s\n' % user)
                        elif line.startswith("# Date "):
                            date = line[7:]
                        elif line.startswith("# Branch "):
                            branch = line[9:]
                        elif line.startswith("# Node ID "):
                            nodeid = line[10:]
                        elif line.startswith("# Parent "):
                            # the matched prefix is 9 characters long;
                            # strip any extra separating blanks instead
                            # of assuming a fixed offset, so the first
                            # character of the id is never lost
                            parents.append(line[9:].lstrip())
                        elif not line.startswith("# "):
                            hgpatchheader = False
                    elif line == '---' and gitsendmail:
                        # git-send-email puts a diffstat after '---'
                        ignoretext = True
                    if not hgpatchheader and not ignoretext:
                        cfp.write(line)
                        cfp.write('\n')
                message = cfp.getvalue()
                if tmpfp:
                    tmpfp.write(payload)
                    if not payload.endswith('\n'):
                        tmpfp.write('\n')
            elif not diffs_seen and message and content_type == 'text/plain':
                message += '\n' + payload
    except:
        # cleanup only: the exception is always re-raised
        tmpfp.close()
        os.unlink(tmpname)
        raise

    if subject and not message.startswith(subject):
        message = '%s\n%s' % (subject, message)
    tmpfp.close()
    if not diffs_seen:
        os.unlink(tmpname)
        return None, message, user, date, branch, None, None, None
    p1 = parents and parents.pop(0) or None
    p2 = parents and parents.pop(0) or None
    return tmpname, message, user, date, branch, nodeid, p1, p2
261 261
262 262 class patchmeta(object):
263 263 """Patched file metadata
264 264
265 265 'op' is the performed operation within ADD, DELETE, RENAME, MODIFY
266 266 or COPY. 'path' is patched file path. 'oldpath' is set to the
267 267 origin file when 'op' is either COPY or RENAME, None otherwise. If
268 268 file mode is changed, 'mode' is a tuple (islink, isexec) where
269 269 'islink' is True if the file is a symlink and 'isexec' is True if
270 270 the file is executable. Otherwise, 'mode' is None.
271 271 """
272 272 def __init__(self, path):
273 273 self.path = path
274 274 self.oldpath = None
275 275 self.mode = None
276 276 self.op = 'MODIFY'
277 277 self.binary = False
278 278
279 279 def setmode(self, mode):
280 280 islink = mode & 020000
281 281 isexec = mode & 0100
282 282 self.mode = (islink, isexec)
283 283
284 284 def __repr__(self):
285 285 return "<patchmeta %s %r>" % (self.op, self.path)
286 286
def readgitpatch(lr):
    """Collect git-style metadata for every file in a patch.

    lr is an iterable of patch lines. Returns a list of patchmeta
    objects, one per "diff --git" header matched by gitre, filled from
    the extended header lines which follow it.
    """
    found = []
    current = None
    for rawline in lr:
        text = rawline.rstrip(' \r\n')
        if text.startswith('diff --git'):
            match = gitre.match(text)
            if match:
                # a new file starts: flush the one being described
                if current:
                    found.append(current)
                current = patchmeta(match.group(2))
            continue
        if not current:
            # not inside a git header, nothing to record
            continue
        if text.startswith('--- '):
            # regular diff body begins, the git header is over
            found.append(current)
            current = None
        elif text.startswith('rename from '):
            current.op = 'RENAME'
            current.oldpath = text[12:]
        elif text.startswith('rename to '):
            current.path = text[10:]
        elif text.startswith('copy from '):
            current.op = 'COPY'
            current.oldpath = text[10:]
        elif text.startswith('copy to '):
            current.path = text[8:]
        elif text.startswith('deleted file'):
            current.op = 'DELETE'
        elif text.startswith('new file mode '):
            current.op = 'ADD'
            # the mode is the trailing six octal digits
            current.setmode(int(text[-6:], 8))
        elif text.startswith('new mode '):
            current.setmode(int(text[-6:], 8))
        elif text.startswith('GIT binary patch'):
            current.binary = True
    if current:
        found.append(current)

    return found
330 330
class linereader(object):
    """Line reader which allows pushing lines back into the input.

    Pushed lines are returned first, in the order they were pushed.
    'eol' remembers the first line ending ('\\r\\n' or '\\n') read from
    fp. With textmode set, a trailing CRLF read from fp is turned into
    LF.
    """
    def __init__(self, fp, textmode=False):
        self.fp = fp
        self.buf = []
        self.textmode = textmode
        self.eol = None

    def push(self, line):
        # None is silently ignored
        if line is None:
            return
        self.buf.append(line)

    def readline(self):
        if self.buf:
            # pushed-back lines are handed out untouched
            return self.buf.pop(0)
        line = self.fp.readline()
        crlf = line.endswith('\r\n')
        if not self.eol:
            if crlf:
                self.eol = '\r\n'
            elif line.endswith('\n'):
                self.eol = '\n'
        if crlf and self.textmode:
            return line[:-2] + '\n'
        return line

    def __iter__(self):
        # stop at the first empty (false) line, i.e. end of input
        line = self.readline()
        while line:
            yield line
            line = self.readline()
364 364
class abstractbackend(object):
    """Interface used by the patching code to access target files.

    Subclasses implement the operations below; only writerej() has a
    default (no-op) implementation, every other method raises
    NotImplementedError.
    """
    def __init__(self, ui):
        # ui object kept for use by subclasses
        self.ui = ui

    def readlines(self, fname):
        """Return target file lines, or its content as a single line
        for symlinks.
        """
        raise NotImplementedError

    def writelines(self, fname, lines, mode):
        """Write lines to target file. mode is a (islink, isexec)
        tuple, or None if there is no mode information.
        """
        raise NotImplementedError

    def unlink(self, fname):
        """Unlink target file."""
        raise NotImplementedError

    def writerej(self, fname, failed, total, lines):
        """Write rejected lines for fname. failed is the number of hunks
        which failed to apply and total the total number of hunks for
        this file.
        """
        pass

    def copy(self, src, dst):
        """Copy src file into dst file. Create intermediate directories if
        necessary. Files are specified relatively to the patching base
        directory.
        """
        raise NotImplementedError

    def exists(self, fname):
        """Tell whether the target file exists."""
        raise NotImplementedError

    def setmode(self, fname, islink, isexec):
        """Change target file mode."""
        raise NotImplementedError
405 405
406 406 class fsbackend(abstractbackend):
407 407 def __init__(self, ui, basedir):
408 408 super(fsbackend, self).__init__(ui)
409 409 self.opener = scmutil.opener(basedir)
410 410
411 411 def _join(self, f):
412 412 return os.path.join(self.opener.base, f)
413 413
414 414 def readlines(self, fname):
415 415 if os.path.islink(self._join(fname)):
416 416 return [os.readlink(self._join(fname))]
417 417 fp = self.opener(fname, 'r')
418 418 try:
419 419 return list(fp)
420 420 finally:
421 421 fp.close()
422 422
423 423 def writelines(self, fname, lines, mode):
424 424 if not mode:
425 425 # Preserve mode information
426 426 isexec, islink = False, False
427 427 try:
428 428 isexec = os.lstat(self._join(fname)).st_mode & 0100 != 0
429 429 islink = os.path.islink(self._join(fname))
430 430 except OSError, e:
431 431 if e.errno != errno.ENOENT:
432 432 raise
433 433 else:
434 434 islink, isexec = mode
435 435 if islink:
436 436 self.opener.symlink(''.join(lines), fname)
437 437 else:
438 438 self.opener(fname, 'w').writelines(lines)
439 439 if isexec:
440 440 util.setflags(self._join(fname), False, True)
441 441
442 442 def unlink(self, fname):
443 443 try:
444 444 util.unlinkpath(self._join(fname))
445 445 except OSError, inst:
446 446 if inst.errno != errno.ENOENT:
447 447 raise
448 448
449 449 def writerej(self, fname, failed, total, lines):
450 450 fname = fname + ".rej"
451 451 self.ui.warn(
452 452 _("%d out of %d hunks FAILED -- saving rejects to file %s\n") %
453 453 (failed, total, fname))
454 454 fp = self.opener(fname, 'w')
455 455 fp.writelines(lines)
456 456 fp.close()
457 457
458 458 def copy(self, src, dst):
459 459 basedir = self.opener.base
460 460 abssrc, absdst = [scmutil.canonpath(basedir, basedir, x)
461 461 for x in [src, dst]]
462 462 if os.path.lexists(absdst):
463 463 raise util.Abort(_("cannot create %s: destination already exists")
464 464 % dst)
465 465 dstdir = os.path.dirname(absdst)
466 466 if dstdir and not os.path.isdir(dstdir):
467 467 try:
468 468 os.makedirs(dstdir)
469 469 except IOError:
470 470 raise util.Abort(
471 471 _("cannot create %s: unable to create destination directory")
472 472 % dst)
473 473 util.copyfile(abssrc, absdst)
474 474
475 475 def exists(self, fname):
476 476 return os.path.lexists(self._join(fname))
477 477
478 478 def setmode(self, fname, islink, isexec):
479 479 util.setflags(self._join(fname), islink, isexec)
480 480
class workingbackend(fsbackend):
    """fsbackend rooted at repo.root which records the files it
    touches so that close() can register them with the repository.
    """
    def __init__(self, ui, repo, similarity):
        super(workingbackend, self).__init__(ui, repo.root)
        self.repo = repo
        self.similarity = similarity
        # bookkeeping filled in by the mutating methods below
        self.changed = set()
        self.removed = set()
        self.copied = []

    def writelines(self, fname, lines, mode):
        super(workingbackend, self).writelines(fname, lines, mode)
        self.changed.add(fname)

    def unlink(self, fname):
        super(workingbackend, self).unlink(fname)
        for touched in (self.removed, self.changed):
            touched.add(fname)

    def copy(self, src, dst):
        super(workingbackend, self).copy(src, dst)
        self.copied.append((src, dst))
        self.changed.add(dst)

    def setmode(self, fname, islink, isexec):
        super(workingbackend, self).setmode(fname, islink, isexec)
        self.changed.add(fname)

    def close(self):
        """Record copies, removals and additions in the working
        context and return the sorted list of changed files."""
        repo = self.repo
        wctx = repo[None]
        pending = set(self.changed)
        for src, dst in self.copied:
            scmutil.dirstatecopy(self.ui, repo, wctx, src, dst)
            pending.discard(src)
        if self.removed and not self.similarity:
            wctx.remove(sorted(self.removed))
        if pending:
            cwd = repo.getcwd()
            if cwd:
                # addremove is given paths relative to the cwd
                pending = [util.pathto(repo.root, cwd, f)
                           for f in pending]
            scmutil.addremove(repo, pending, similarity=self.similarity)
        return sorted(self.changed)
523 523
# @@ -start,len +start,len @@ or @@ -start +start @@ if len is 1
unidesc = re.compile('@@ -(\d+)(,(\d+))? \+(\d+)(,(\d+))? @@')
# range line of a context diff: "*** start,end ***" or "--- start,end ---"
# (",end" is optional)
contextdesc = re.compile('(---|\*\*\*) (\d+)(,(\d+))? (---|\*\*\*)')
# names of the end-of-line handling modes (see patchfile's eolmode)
eolmodes = ['strict', 'crlf', 'lf', 'auto']
528 528
class patchfile(object):
    """In-memory state of one target file while hunks are applied.

    The file content is read through 'backend', modified in self.lines
    by apply() and written back, together with any rejects, by close().
    """
    def __init__(self, ui, fname, backend, mode, missing=False,
                 eolmode='strict'):
        """Load fname through backend unless it is flagged as missing.

        mode is passed through to the backend when writing. With
        missing set, a warning is printed and apply() rejects every
        hunk. eolmode selects the end-of-line handling (see eolmodes).
        """
        self.fname = fname
        self.eolmode = eolmode
        self.eol = None
        self.backend = backend
        self.ui = ui
        self.lines = []
        self.exists = False
        self.missing = missing
        self.mode = mode
        if not missing:
            try:
                self.lines = self.backend.readlines(fname)
                if self.lines:
                    # Normalize line endings
                    # (the first line decides which eol the file uses)
                    if self.lines[0].endswith('\r\n'):
                        self.eol = '\r\n'
                    elif self.lines[0].endswith('\n'):
                        self.eol = '\n'
                    if eolmode != 'strict':
                        nlines = []
                        for l in self.lines:
                            if l.endswith('\r\n'):
                                l = l[:-2] + '\n'
                            nlines.append(l)
                        self.lines = nlines
                self.exists = True
            except IOError:
                # unreadable target: self.exists stays False
                pass
        else:
            self.ui.warn(_("unable to find '%s' for patching\n") % self.fname)

        # line content -> list of line indexes, rebuilt by apply()
        self.hash = {}
        self.dirty = 0
        # line count delta introduced by the hunks applied so far
        self.offset = 0
        # distance from the expected position of the last hunk which
        # had to be relocated
        self.skew = 0
        # hunks which could not be applied
        self.rej = []
        self.fileprinted = False
        self.printfile(False)
        # number of hunks passed to apply()
        self.hunks = 0

    def writelines(self, fname, lines, mode):
        """Write lines through the backend, converting LF line endings
        to the eol selected by self.eolmode when it is not LF."""
        if self.eolmode == 'auto':
            eol = self.eol
        elif self.eolmode == 'crlf':
            eol = '\r\n'
        else:
            eol = '\n'

        if self.eolmode != 'strict' and eol and eol != '\n':
            rawlines = []
            for l in lines:
                if l and l[-1] == '\n':
                    l = l[:-1] + eol
                rawlines.append(l)
            lines = rawlines

        self.backend.writelines(fname, lines, mode)

    def printfile(self, warn):
        """Print the "patching file" message, as a warning if warn is
        set and as a note otherwise; nothing is printed once
        self.fileprinted has been set."""
        if self.fileprinted:
            return
        if warn or self.ui.verbose:
            self.fileprinted = True
        s = _("patching file %s\n") % self.fname
        if warn:
            self.ui.warn(s)
        else:
            self.ui.note(s)


    def findlines(self, l, linenum):
        # looks through the hash and finds candidate lines. The
        # result is a list of line numbers sorted based on distance
        # from linenum

        cand = self.hash.get(l, [])
        if len(cand) > 1:
            # resort our list of potentials forward then back.
            # (the list stored in self.hash is sorted in place)
            cand.sort(key=lambda x: abs(x - linenum))
        return cand

    def write_rej(self):
        # our rejects are a little different from patch(1). This always
        # creates rejects in the same form as the original patch. A file
        # header is inserted so that you can run the reject through patch again
        # without having to type the filename.
        if not self.rej:
            return
        base = os.path.basename(self.fname)
        lines = ["--- %s\n+++ %s\n" % (base, base)]
        for x in self.rej:
            for l in x.hunk:
                lines.append(l)
                if l[-1] != '\n':
                    lines.append("\n\ No newline at end of file\n")
        self.backend.writerej(self.fname, len(self.rej), self.hunks, lines)

    def apply(self, h):
        """Apply hunk h to the in-memory lines.

        Returns 0 when the hunk applied at its expected position, the
        fuzz level used when it had to be relocated, and -1 when it
        was rejected (the hunk is then stored in self.rej). Raises
        PatchError if the hunk is incomplete.
        """
        if not h.complete():
            raise PatchError(_("bad hunk #%d %s (%d %d %d %d)") %
                            (h.number, h.desc, len(h.a), h.lena, len(h.b),
                            h.lenb))

        self.hunks += 1

        if self.missing:
            self.rej.append(h)
            return -1

        if self.exists and h.createfile():
            self.ui.warn(_("file %s already exists\n") % self.fname)
            self.rej.append(h)
            return -1

        if isinstance(h, binhunk):
            # binary hunks replace the whole content or remove the file
            if h.rmfile():
                self.backend.unlink(self.fname)
            else:
                self.lines[:] = h.new()
                self.offset += len(h.new())
                self.dirty = True
            return 0

        # rejects are recorded with the original, non-normalized hunk
        horig = h
        if (self.eolmode in ('crlf', 'lf')
            or self.eolmode == 'auto' and self.eol):
            # If new eols are going to be normalized, then normalize
            # hunk data before patching. Otherwise, preserve input
            # line-endings.
            h = h.getnormalized()

        # fast case first, no offsets, no fuzz
        old = h.old()
        # patch starts counting at 1 unless we are adding the file
        if h.starta == 0:
            start = 0
        else:
            start = h.starta + self.offset - 1
        orig_start = start
        # if there's skew we want to emit the "(offset %d lines)" even
        # when the hunk cleanly applies at start + skew, so skip the
        # fast case code
        if self.skew == 0 and diffhelpers.testhunk(old, self.lines, start) == 0:
            if h.rmfile():
                self.backend.unlink(self.fname)
            else:
                self.lines[start : start + h.lena] = h.new()
                self.offset += h.lenb - h.lena
                self.dirty = True
            return 0

        # ok, we couldn't match the hunk. Lets look for offsets and fuzz it
        self.hash = {}
        for x, s in enumerate(self.lines):
            self.hash.setdefault(s, []).append(x)
        if h.hunk[-1][0] != ' ':
            # if the hunk tried to put something at the bottom of the file
            # override the start line and use eof here
            search_start = len(self.lines)
        else:
            search_start = orig_start + self.skew

        # try increasing fuzz levels, trimming context from the top
        # only first, then from both ends
        for fuzzlen in xrange(3):
            for toponly in [True, False]:
                old = h.old(fuzzlen, toponly)

                # candidate positions: lines equal to the first old line
                cand = self.findlines(old[0][1:], search_start)
                for l in cand:
                    if diffhelpers.testhunk(old, self.lines, l) == 0:
                        newlines = h.new(fuzzlen, toponly)
                        self.lines[l : l + len(old)] = newlines
                        self.offset += len(newlines) - len(old)
                        self.skew = l - orig_start
                        self.dirty = True
                        offset = l - orig_start - fuzzlen
                        if fuzzlen:
                            msg = _("Hunk #%d succeeded at %d "
                                    "with fuzz %d "
                                    "(offset %d lines).\n")
                            self.printfile(True)
                            self.ui.warn(msg %
                                (h.number, l + 1, fuzzlen, offset))
                        else:
                            msg = _("Hunk #%d succeeded at %d "
                                    "(offset %d lines).\n")
                            self.ui.note(msg % (h.number, l + 1, offset))
                        return fuzzlen
        self.printfile(True)
        self.ui.warn(_("Hunk #%d FAILED at %d\n") % (h.number, orig_start))
        self.rej.append(horig)
        return -1

    def close(self):
        """Write the modified content and the rejects, if any, and
        return the number of rejected hunks."""
        if self.dirty:
            self.writelines(self.fname, self.lines, self.mode)
        self.write_rej()
        return len(self.rej)
729 729
class hunk(object):
    """One hunk of a unified or context diff.

    self.hunk holds the hunk in unified form (description line first),
    self.a the old side and self.b the new side, with starta/lena and
    startb/lenb taken from the description line.
    """
    def __init__(self, desc, num, lr, context, create=False, remove=False):
        """Parse a hunk from lr, as a context diff if context is true
        and as a unified diff otherwise. No parsing happens when lr is
        None. desc is the description line and num the hunk number
        used in messages."""
        self.number = num
        self.desc = desc
        self.hunk = [desc]
        self.a = []
        self.b = []
        self.starta = self.lena = None
        self.startb = self.lenb = None
        if lr is not None:
            if context:
                self.read_context_hunk(lr)
            else:
                self.read_unified_hunk(lr)
        self.create = create
        # a hunk never both creates and removes the file
        self.remove = remove and not create

    def getnormalized(self):
        """Return a copy with line endings normalized to LF."""

        def normalize(lines):
            nlines = []
            for line in lines:
                if line.endswith('\r\n'):
                    line = line[:-2] + '\n'
                nlines.append(line)
            return nlines

        # Dummy object, it is rebuilt manually
        nh = hunk(self.desc, self.number, None, None, False, False)
        nh.number = self.number
        nh.desc = self.desc
        # note: self.hunk is shared with the copy, not normalized
        nh.hunk = self.hunk
        nh.a = normalize(self.a)
        nh.b = normalize(self.b)
        nh.starta = self.starta
        nh.startb = self.startb
        nh.lena = self.lena
        nh.lenb = self.lenb
        nh.create = self.create
        nh.remove = self.remove
        return nh

    def read_unified_hunk(self, lr):
        """Parse the body of a unified hunk described by self.desc.

        Raises PatchError when the description does not match unidesc.
        """
        m = unidesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.starta, foo, self.lena, self.startb, foo2, self.lenb = m.groups()
        # a missing length means a single line
        if self.lena is None:
            self.lena = 1
        else:
            self.lena = int(self.lena)
        if self.lenb is None:
            self.lenb = 1
        else:
            self.lenb = int(self.lenb)
        self.starta = int(self.starta)
        self.startb = int(self.startb)
        diffhelpers.addlines(lr, self.hunk, self.lena, self.lenb, self.a, self.b)
        # if we hit eof before finishing out the hunk, the last line will
        # be zero length. Lets try to fix it up.
        while len(self.hunk[-1]) == 0:
            del self.hunk[-1]
            del self.a[-1]
            del self.b[-1]
            self.lena -= 1
            self.lenb -= 1
        self._fixnewline(lr)

    def read_context_hunk(self, lr):
        """Parse a context diff hunk from lr and convert it to the
        unified representation (self.desc and self.hunk are rewritten).

        Raises PatchError on a malformed range line or text line.
        """
        self.desc = lr.readline()
        m = contextdesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        foo, self.starta, foo2, aend, foo3 = m.groups()
        self.starta = int(self.starta)
        if aend is None:
            aend = self.starta
        # the range gives start and end lines, turn it into a length
        self.lena = int(aend) - self.starta
        if self.starta:
            self.lena += 1
        # old block
        for x in xrange(self.lena):
            l = lr.readline()
            if l.startswith('---'):
                # lines addition, old block is empty
                lr.push(l)
                break
            s = l[2:]
            if l.startswith('- ') or l.startswith('! '):
                u = '-' + s
            # NOTE(review): the payload is taken from l[2:], i.e. a
            # two-character prefix is assumed, while only one leading
            # space is tested here -- confirm against the original file
            elif l.startswith(' '):
                u = ' ' + s
            else:
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.a.append(u)
            self.hunk.append(u)

        l = lr.readline()
        if l.startswith('\ '):
            # no-eol marker: drop the last character of the last old line
            s = self.a[-1][:-1]
            self.a[-1] = s
            self.hunk[-1] = s
            l = lr.readline()
        m = contextdesc.match(l)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        foo, self.startb, foo2, bend, foo3 = m.groups()
        self.startb = int(self.startb)
        if bend is None:
            bend = self.startb
        self.lenb = int(bend) - self.startb
        if self.startb:
            self.lenb += 1
        # index in self.hunk where the next new line is merged
        hunki = 1
        # new block
        for x in xrange(self.lenb):
            l = lr.readline()
            if l.startswith('\ '):
                # XXX: the only way to hit this is with an invalid line range.
                # The no-eol marker is not counted in the line range, but I
                # guess there are diff(1) out there which behave differently.
                s = self.b[-1][:-1]
                self.b[-1] = s
                self.hunk[hunki - 1] = s
                continue
            if not l:
                # line deletions, new block is empty and we hit EOF
                lr.push(l)
                break
            s = l[2:]
            if l.startswith('+ ') or l.startswith('! '):
                u = '+' + s
            elif l.startswith(' '):
                u = ' ' + s
            elif len(self.b) == 0:
                # line deletions, new block is empty
                lr.push(l)
                break
            else:
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.b.append(s)
            # merge u into the unified hunk: skip over removed lines,
            # stop on a line equal to u, insert u otherwise
            while True:
                if hunki >= len(self.hunk):
                    h = ""
                else:
                    h = self.hunk[hunki]
                hunki += 1
                if h == u:
                    break
                elif h.startswith('-'):
                    continue
                else:
                    self.hunk.insert(hunki - 1, u)
                    break

        if not self.a:
            # this happens when lines were only added to the hunk
            for x in self.hunk:
                if x.startswith('-') or x.startswith(' '):
                    self.a.append(x)
        if not self.b:
            # this happens when lines were only deleted from the hunk
            for x in self.hunk:
                if x.startswith('+') or x.startswith(' '):
                    self.b.append(x[1:])
        # @@ -start,len +start,len @@
        self.desc = "@@ -%d,%d +%d,%d @@\n" % (self.starta, self.lena,
                                             self.startb, self.lenb)
        self.hunk[0] = self.desc
        self._fixnewline(lr)

    def _fixnewline(self, lr):
        """Consume a trailing no-eol marker line if one follows the
        hunk and let diffhelpers.fix_newline adjust the hunk data;
        any other line is pushed back."""
        l = lr.readline()
        if l.startswith('\ '):
            diffhelpers.fix_newline(self.hunk, self.a, self.b)
        else:
            lr.push(l)

    def complete(self):
        """Tell whether both sides have the announced number of lines."""
        return len(self.a) == self.lena and len(self.b) == self.lenb

    def createfile(self):
        """Tell whether this hunk creates the target file."""
        return self.starta == 0 and self.lena == 0 and self.create

    def rmfile(self):
        """Tell whether this hunk removes the target file."""
        return self.startb == 0 and self.lenb == 0 and self.remove

    def fuzzit(self, l, fuzz, toponly):
        # this removes context lines from the top and bottom of list 'l'. It
        # checks the hunk to make sure only context lines are removed, and then
        # returns a new shortened list of lines.
        # at least one line of 'l' is always kept
        fuzz = min(fuzz, len(l)-1)
        if fuzz:
            top = 0
            bot = 0
            hlen = len(self.hunk)
            # count leading context lines
            for x in xrange(hlen - 1):
                # the hunk starts with the @@ line, so use x+1
                if self.hunk[x + 1][0] == ' ':
                    top += 1
                else:
                    break
            if not toponly:
                # count trailing context lines
                for x in xrange(hlen - 1):
                    if self.hunk[hlen - bot - 1][0] == ' ':
                        bot += 1
                    else:
                        break

            # top and bot now count context in the hunk
            # adjust them if either one is short
            context = max(top, bot, 3)
            if bot < context:
                bot = max(0, fuzz - (context - bot))
            else:
                bot = min(fuzz, bot)
            if top < context:
                top = max(0, fuzz - (context - top))
            else:
                top = min(fuzz, top)

            return l[top:len(l)-bot]
        return l

    def old(self, fuzz=0, toponly=False):
        """Return the old side of the hunk, trimmed by fuzzit()."""
        return self.fuzzit(self.a, fuzz, toponly)

    def new(self, fuzz=0, toponly=False):
        """Return the new side of the hunk, trimmed by fuzzit()."""
        return self.fuzzit(self.b, fuzz, toponly)
960 960
class binhunk:
    'A binary patch file. Only understands literals so far.'
    def __init__(self, gitpatch):
        # gitpatch: metadata object whose 'op' attribute names the
        # operation performed on the file
        self.gitpatch = gitpatch
        # decoded file content, None until extract() succeeds
        self.text = None
        # raw patch lines, kept so the hunk can be written as a reject
        self.hunk = ['GIT binary patch\n']

    def createfile(self):
        """Tell whether the patch adds the file."""
        return self.gitpatch.op == 'ADD'

    def rmfile(self):
        """Tell whether the patch deletes the file."""
        return self.gitpatch.op == 'DELETE'

    def complete(self):
        """Tell whether the content has been extracted."""
        return self.text is not None

    def new(self):
        """Return the new content as a one-element list."""
        return [self.text]

    def extract(self, lr):
        """Read a "literal" binary patch from lr and decode it.

        Every line read is appended to self.hunk. Each data line
        starts with a character giving the decoded length of the
        line ('A'-'Z' for 1-26, 'a'-'z' for 27-52) followed by base85
        data; the concatenated result is zlib-compressed. The decoded
        content is stored in self.text.

        Raises PatchError when no "literal" line is found or when the
        decoded size differs from the announced one.
        """
        line = lr.readline()
        self.hunk.append(line)
        # skip everything up to the "literal <size>" line
        while line and not line.startswith('literal '):
            line = lr.readline()
            self.hunk.append(line)
        if not line:
            raise PatchError(_('could not extract binary patch'))
        size = int(line[8:].rstrip())
        dec = []
        line = lr.readline()
        self.hunk.append(line)
        # data lines run until an empty line or end of input
        while len(line) > 1:
            l = line[0]
            if l <= 'Z' and l >= 'A':
                l = ord(l) - ord('A') + 1
            else:
                l = ord(l) - ord('a') + 27
            # drop the padding beyond the announced line length
            dec.append(base85.b85decode(line[1:-1])[:l])
            line = lr.readline()
            self.hunk.append(line)
        text = zlib.decompress(''.join(dec))
        if len(text) != size:
            # both values must be passed as one tuple to the % operator
            raise PatchError(_('binary patch is %d bytes, not %d') %
                             (len(text), size))
        self.text = text
1006 1006
def parsefilename(str):
    '''extract the file name from a "--- name" or "+++ name" line

    The first four characters and the trailing EOL are dropped, then
    the name is cut at the first tab or, if there is none, at the
    first space.
    '''
    # --- filename \t|space stuff
    name = str[4:].rstrip('\r\n')
    for sep in ('\t', ' '):
        cut = name.find(sep)
        if cut >= 0:
            return name[:cut]
    return name
1016 1016
def pathstrip(path, strip):
    '''split path after its first 'strip' directory components

    Return a (stripped prefix, remaining path) pair. The prefix has
    its leading whitespace removed, the remainder its trailing
    whitespace. Raise PatchError if path has fewer than 'strip'
    slash separated components.
    '''
    if strip == 0:
        return '', path.rstrip()
    lastidx = len(path) - 1
    pos = 0
    for remaining in range(strip, 0, -1):
        pos = path.find('/', pos)
        if pos == -1:
            raise PatchError(_("unable to strip away %d of %d dirs from %s") %
                             (remaining, strip, path))
        pos += 1
        # consume '//' in the path
        while pos < lastidx and path[pos] == '/':
            pos += 1
    return path[:pos].lstrip(), path[pos:].rstrip()
1034 1034
def selectfile(backend, afile_orig, bfile_orig, hunk, strip):
    '''pick the file a hunk should be applied to

    Return a (fname, missing) pair. Paths are stripped with
    pathstrip() and looked up with backend.exists(). hunk.create may
    be set as a side effect. Raise PatchError when both sides are
    /dev/null.
    '''
    nulla = afile_orig == "/dev/null"
    nullb = bfile_orig == "/dev/null"
    abase, afile = pathstrip(afile_orig, strip)
    gooda = not nulla and backend.exists(afile)
    bbase, bfile = pathstrip(bfile_orig, strip)
    if afile != bfile:
        goodb = not nullb and backend.exists(bfile)
    else:
        goodb = gooda
    createfunc = hunk.createfile
    missing = not (goodb or gooda or createfunc())

    # some diff programs apparently produce patches where the afile is
    # not /dev/null, but afile starts with bfile
    adir = afile[:afile.rfind('/') + 1]
    bdir = bfile[:bfile.rfind('/') + 1]
    if missing and adir == bdir and afile.startswith(bfile):
        # this isn't very pretty
        hunk.create = True
        if createfunc():
            missing = False
        else:
            hunk.create = False

    # If afile is "a/b/foo" and bfile is "a/b/foo.orig" we assume the
    # diff is between a file and its backup. In this case, the original
    # file should be patched (see original mpatch code).
    isbackup = (abase == bbase and bfile.startswith(afile))
    preferred = isbackup and afile or bfile

    fname = None
    if not missing and gooda:
        if goodb:
            fname = preferred
        else:
            fname = afile

    if not fname:
        if not nullb:
            fname = preferred
        elif not nulla:
            fname = afile
        else:
            raise PatchError(_("undefined source and destination files"))

    return fname, missing
1080 1080
def scangitpatch(lr, firstline):
    """
    Git patches can emit:
    - rename a to b
    - change b
    - copy a to c
    - change c

    Applying this sequence as-is is not possible: 'a' is gone once it
    has been renamed, and 'b' cannot be used as the copy source since
    it has been changed by then. The git patch is therefore scanned
    up front for copy and rename commands so the copies can be done
    ahead of time.

    firstline is pushed back before scanning and the stream is
    rewound to its initial position afterwards. Return whatever
    readgitpatch() returns.
    """
    source = lr.fp
    pos = 0
    try:
        pos = source.tell()
        fp = source
    except IOError:
        # tell() failed: scan an in-memory copy of the remaining data
        fp = cStringIO.StringIO(source.read())
    scanner = linereader(fp, lr.textmode)
    scanner.push(firstline)
    gitpatches = readgitpatch(scanner)
    fp.seek(pos)
    return gitpatches
1106 1106
def iterhunks(fp):
    """Read a patch and yield the following events:
    - ("file", (afile, bfile, firsthunk, mode)): select a new target
      file. mode is the mode of the matching git record, or None.
    - ("hunk", hunk): a new hunk is ready to be applied, follows a
      "file" event.
    - ("git", gitpatches): current diff is in git format, gitpatches
      is the sequence of gitpatch records returned by scangitpatch().
      Unique event.
    """
    # git records seen so far, indexed by their path
    changed = {}
    afile = ""
    bfile = ""
    state = None
    hunknum = 0
    emitfile = newfile = False
    git = False

    # our states
    BFILE = 1
    # None: format unknown, True: context diff, False: unified diff
    context = None
    lr = linereader(fp)

    while True:
        x = lr.readline()
        if not x:
            break
        if state == BFILE and (
            (not context and x[0] == '@')
            or (context is not False and x.startswith('***************'))
            or x.startswith('GIT binary patch')):
            gp = changed.get(bfile)
            if x.startswith('GIT binary patch'):
                h = binhunk(gp)
                h.extract(lr)
                # the names come from the "diff --git" line without
                # their a/ and b/ prefixes, restore them for consumers
                afile = 'a/' + afile
                bfile = 'b/' + bfile
            else:
                if context is None and x.startswith('***************'):
                    context = True
                create = afile == '/dev/null' or gp and gp.op == 'ADD'
                remove = bfile == '/dev/null' or gp and gp.op == 'DELETE'
                h = hunk(x, hunknum + 1, lr, context, create, remove)
            hunknum += 1
            if emitfile:
                # first hunk of a file: announce the file first
                emitfile = False
                yield 'file', (afile, bfile, h, gp and gp.mode or None)
            yield 'hunk', h
        elif x.startswith('diff --git'):
            # check for git diff, scanning the whole patch file if needed
            m = gitre.match(x)
            if m:
                afile, bfile = m.group(1, 2)
                if not git:
                    git = True
                    gitpatches = scangitpatch(lr, x)
                    yield 'git', gitpatches
                    for gp in gitpatches:
                        changed[gp.path] = gp
                # else error?
                # copy/rename + modify should modify target, not source
                gp = changed.get(bfile)
                if gp and (gp.op in ('COPY', 'DELETE', 'RENAME', 'ADD')
                           or gp.mode):
                    afile = bfile
                newfile = True
        elif x.startswith('---'):
            # check for a unified diff
            l2 = lr.readline()
            if not l2.startswith('+++'):
                lr.push(l2)
                continue
            newfile = True
            context = False
            afile = parsefilename(x)
            bfile = parsefilename(l2)
        elif x.startswith('***'):
            # check for a context diff
            l2 = lr.readline()
            if not l2.startswith('---'):
                lr.push(l2)
                continue
            l3 = lr.readline()
            lr.push(l3)
            if not l3.startswith("***************"):
                lr.push(l2)
                continue
            newfile = True
            context = True
            afile = parsefilename(x)
            bfile = parsefilename(l2)

        if newfile:
            newfile = False
            emitfile = True
            state = BFILE
            hunknum = 0
1204 1202
def applydiff(ui, fp, changed, backend, strip=1, eolmode='strict'):
    """Reads a patch from fp and tries to apply it.

    'changed' is a dict which receives the names of all files changed
    by the patch. The result is 0 for a clean patch, -1 if any rejects
    were found and 1 if there was any fuzz.

    With 'eolmode' set to 'strict', the patch content and patched file
    are read in binary mode. Otherwise, line endings are ignored when
    patching then normalized according to 'eolmode'.
    """
    options = {'strip': strip, 'eolmode': eolmode}
    return _applydiff(ui, fp, patchfile, backend, changed, **options)
1218 1216
1219 1217 def _applydiff(ui, fp, patcher, backend, changed, strip=1, eolmode='strict'):
1220 1218 rejects = 0
1221 1219 err = 0
1222 1220 current_file = None
1223 1221
1224 1222 for state, values in iterhunks(fp):
1225 1223 if state == 'hunk':
1226 1224 if not current_file:
1227 1225 continue
1228 1226 ret = current_file.apply(values)
1229 1227 if ret >= 0:
1230 1228 changed.setdefault(current_file.fname, None)
1231 1229 if ret > 0:
1232 1230 err = 1
1233 1231 elif state == 'file':
1234 1232 if current_file:
1235 1233 rejects += current_file.close()
1236 1234 afile, bfile, first_hunk, mode = values
1237 1235 try:
1238 1236 current_file, missing = selectfile(backend, afile, bfile,
1239 1237 first_hunk, strip)
1240 1238 current_file = patcher(ui, current_file, backend, mode,
1241 1239 missing=missing, eolmode=eolmode)
1242 1240 except PatchError, inst:
1243 1241 ui.warn(str(inst) + '\n')
1244 1242 current_file = None
1245 1243 rejects += 1
1246 1244 continue
1247 1245 elif state == 'git':
1248 1246 for gp in values:
1249 1247 gp.path = pathstrip(gp.path, strip - 1)[1]
1250 1248 if gp.oldpath:
1251 1249 gp.oldpath = pathstrip(gp.oldpath, strip - 1)[1]
1252 1250 if gp.op in ('COPY', 'RENAME'):
1253 1251 backend.copy(gp.oldpath, gp.path)
1254 1252 changed[gp.path] = gp
1255 1253 else:
1256 1254 raise util.Abort(_('unsupported parser state: %s') % state)
1257 1255
1258 1256 if current_file:
1259 1257 rejects += current_file.close()
1260 1258
1261 1259 # Handle mode changes without hunk
1262 1260 removed = set()
1263 1261 for gp in changed.itervalues():
1264 1262 if not gp:
1265 1263 continue
1266 1264 if gp.op == 'DELETE':
1267 1265 removed.add(gp.path)
1268 1266 continue
1269 1267 if gp.op == 'RENAME':
1270 1268 removed.add(gp.oldpath)
1271 1269 if gp.mode:
1272 1270 if gp.op == 'ADD' and not backend.exists(gp.path):
1273 1271 # Added files without content have no hunk and must be created
1274 1272 backend.writelines(gp.path, [], gp.mode)
1275 1273 else:
1276 1274 backend.setmode(gp.path, gp.mode[0], gp.mode[1])
1277 1275 for path in sorted(removed):
1278 1276 backend.unlink(path)
1279 1277
1280 1278 if rejects:
1281 1279 return -1
1282 1280 return err
1283 1281
def _externalpatch(ui, repo, patcher, patchname, strip, files,
                   similarity):
    """use <patcher> to apply <patchname> to the working directory.
    returns whether patch was applied with fuzz factor.

    'files' is a dict which receives the names reported by the
    patcher in its "patching file" lines. Once the patcher output has
    been read, scmutil.addremove() is run on these files. Raise
    PatchError if the patcher exits with a non-zero status."""

    fuzz = False
    # no file has been announced by the patcher yet, so there is no
    # name to print if a warning shows up before "patching file"
    pf = None
    printed_file = True
    args = []
    cwd = repo.root
    if cwd:
        args.append('-d %s' % util.shellquote(cwd))
    fp = util.popen('%s %s -p%d < %s' % (patcher, ' '.join(args), strip,
                                       util.shellquote(patchname)))
    try:
        for line in fp:
            line = line.rstrip()
            ui.note(line + '\n')
            if line.startswith('patching file '):
                pf = util.parsepatchoutput(line)
                printed_file = False
                files.setdefault(pf, None)
            elif line.find('with fuzz') >= 0:
                fuzz = True
                if not printed_file:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
            elif line.find('saving rejects to file') >= 0:
                ui.warn(line + '\n')
            elif line.find('FAILED') >= 0:
                if not printed_file:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
    finally:
        if files:
            cfiles = list(files)
            cwd = repo.getcwd()
            if cwd:
                # iterate cfiles: the original looped over the
                # undefined name 'cfile' and raised NameError here
                cfiles = [util.pathto(repo.root, cwd, f)
                          for f in cfiles]
            scmutil.addremove(repo, cfiles, similarity=similarity)
    code = fp.close()
    if code:
        raise PatchError(_("patch command failed: %s") %
                         util.explainexit(code)[0])
    return fuzz
1330 1328
def internalpatch(ui, repo, patchobj, strip, files=None, eolmode='strict',
                  similarity=0):
    """use builtin patch to apply <patchobj> to the working directory.
    returns whether patch was applied with fuzz factor.

    patchobj is handed to open(); if that raises TypeError it is used
    directly as the patch source. 'files' is updated with the result
    of backend.close(). Raise util.Abort on an unknown eolmode and
    PatchError if the patch does not apply."""

    if files is None:
        files = {}
    if eolmode is None:
        eolmode = ui.config('patch', 'eol', 'strict')
    normalized = eolmode.lower()
    if normalized not in eolmodes:
        raise util.Abort(_('unsupported line endings type: %s') % eolmode)
    eolmode = normalized

    backend = workingbackend(ui, repo, similarity)
    try:
        fp = open(patchobj, 'rb')
    except TypeError:
        fp = patchobj
    try:
        ret = applydiff(ui, fp, files, backend, strip=strip, eolmode=eolmode)
    finally:
        # only close what was opened here
        if fp != patchobj:
            fp.close()
        touched = backend.close()
        files.update(dict.fromkeys(touched))
    if ret < 0:
        raise PatchError(_('patch failed to apply'))
    return ret > 0
1358 1356
1359 1357 def patch(ui, repo, patchname, strip=1, files=None, eolmode='strict',
1360 1358 similarity=0):
1361 1359 """Apply <patchname> to the working directory.
1362 1360
1363 1361 'eolmode' specifies how end of lines should be handled. It can be:
1364 1362 - 'strict': inputs are read in binary mode, EOLs are preserved
1365 1363 - 'crlf': EOLs are ignored when patching and reset to CRLF
1366 1364 - 'lf': EOLs are ignored when patching and reset to LF
1367 1365 - None: get it from user settings, default to 'strict'
1368 1366 'eolmode' is ignored when using an external patcher program.
1369 1367
1370 1368 Returns whether patch was applied with fuzz factor.
1371 1369 """
1372 1370 patcher = ui.config('ui', 'patch')
1373 1371 if files is None:
1374 1372 files = {}
1375 1373 try:
1376 1374 if patcher:
1377 1375 return _externalpatch(ui, repo, patcher, patchname, strip,
1378 1376 files, similarity)
1379 1377 return internalpatch(ui, repo, patchname, strip, files, eolmode,
1380 1378 similarity)
1381 1379 except PatchError, err:
1382 1380 raise util.Abort(str(err))
1383 1381
def changedfiles(ui, repo, patchpath, strip=1):
    '''return the set of file names touched by the patch at patchpath

    The patch is parsed with iterhunks() but not applied. For git
    patches the rename sources are included too.
    '''
    backend = fsbackend(ui, repo.root)
    fp = open(patchpath, 'rb')
    try:
        changed = set()
        for state, values in iterhunks(fp):
            if state == 'file':
                afile, bfile, first_hunk, mode = values
                fname, missing = selectfile(backend, afile, bfile,
                                            first_hunk, strip)
                changed.add(fname)
            elif state == 'git':
                for gp in values:
                    gp.path = pathstrip(gp.path, strip - 1)[1]
                    changed.add(gp.path)
                    if gp.oldpath:
                        gp.oldpath = pathstrip(gp.oldpath, strip - 1)[1]
                        if gp.op == 'RENAME':
                            changed.add(gp.oldpath)
            elif state != 'hunk':
                raise util.Abort(_('unsupported parser state: %s') % state)
        return changed
    finally:
        fp.close()
1410 1408
def b85diff(to, tn):
    '''return a base85-encoded git binary diff from to to tn

    The result is an empty string when both contents hash to the same
    git blob id. Only "literal" payloads are produced.
    '''
    def gitindex(text):
        # git blob id of text, null id for empty content
        if not text:
            return hex(nullid)
        s = util.sha1('blob %d\0' % len(text))
        s.update(text)
        return s.hexdigest()

    def fmtline(line):
        # the length prefix is 'A'-'Z' for 1-26 bytes, 'a'-'z' above
        size = len(line)
        if size > 26:
            marker = chr(size - 26 + ord('a') - 1)
        else:
            marker = chr(ord('A') + size - 1)
        return '%c%s\n' % (marker, base85.b85encode(line, True))

    def chunk(text, csize=52):
        # cut text in pieces of at most csize bytes
        for start in range(0, len(text), csize):
            yield text[start:start + csize]

    tohash = gitindex(to)
    tnhash = gitindex(tn)
    if tohash == tnhash:
        return ""

    # TODO: deltas
    header = ('index %s..%s\nGIT binary patch\nliteral %s\n' %
              (tohash, tnhash, len(tn)))
    ret = [header]
    ret.extend([fmtline(piece) for piece in chunk(zlib.compress(tn))])
    ret.append('\n')
    return ''.join(ret)
1448 1446
class GitDiffRequired(Exception):
    '''raised when a change cannot be represented without git format'''
1451 1449
def diffopts(ui, opts=None, untrusted=False):
    '''build mdiff.diffopts from command options and the [diff] section

    A true value in opts wins, otherwise the setting is read from the
    configuration. 'text' is only taken from opts.
    '''
    def get(key, name=None, getter=ui.configbool):
        value = opts and opts.get(key)
        if value:
            return value
        return getter('diff', name or key, None, untrusted=untrusted)

    settings = {
        'text': opts and opts.get('text'),
        'git': get('git'),
        'nodates': get('nodates'),
        'showfunc': get('show_function', 'showfunc'),
        'ignorews': get('ignore_all_space', 'ignorews'),
        'ignorewsamount': get('ignore_space_change', 'ignorewsamount'),
        'ignoreblanklines': get('ignore_blank_lines', 'ignoreblanklines'),
        'context': get('unified', getter=ui.config),
    }
    return mdiff.diffopts(**settings)
1465 1463
def diff(repo, node1=None, node2=None, match=None, changes=None, opts=None,
         losedatafn=None, prefix=''):
    '''yields diff of changes to files between two nodes, or node and
    working directory.

    if node1 is None, use first dirstate parent instead.
    if node2 is None, compare node1 with working directory.

    losedatafn(**kwarg) is a callable run when opts.upgrade=True and
    every time some change cannot be represented with the current
    patch format. It returns False to upgrade to git patch format,
    True to accept the loss, or raises an exception to abort the
    diff. The name of the file being diffed is passed as 'fn'. When
    it is None, patches are always upgraded to git format when
    necessary.

    prefix is a filename prefix that is prepended to all filenames on
    display (used for subrepos).
    '''

    if opts is None:
        opts = mdiff.defaultopts

    if not node1 and not node2:
        node1 = repo.dirstate.p1()

    def lrugetfilectx():
        # filelogs of recently used files, oldest first in 'order'
        cache = {}
        order = []
        def getfilectx(f, ctx):
            fctx = ctx.filectx(f, filelog=cache.get(f))
            if f in cache:
                order.remove(f)
            else:
                if len(cache) > 20:
                    del cache[order.pop(0)]
                cache[f] = fctx.filelog()
            order.append(f)
            return fctx
        return getfilectx
    getfilectx = lrugetfilectx()

    ctx1 = repo[node1]
    ctx2 = repo[node2]

    if not changes:
        changes = repo.status(ctx1, ctx2, match=match)
    modified, added, removed = changes[:3]

    if not (modified or added or removed):
        return []

    revs = None
    if not repo.ui.quiet:
        hexfunc = repo.ui.debugflag and hex or short
        revs = [hexfunc(node) for node in [node1, node2] if node]

    copy = {}
    if opts.git or opts.upgrade:
        copy = copies.copies(repo, ctx1, ctx2, repo[nullid])[0]

    def difffn(opts, losedata):
        return trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
                       copy, getfilectx, opts, losedata, prefix)

    if not opts.upgrade or opts.git:
        return difffn(opts, None)

    def losedata(fn):
        if not losedatafn or not losedatafn(fn=fn):
            raise GitDiffRequired()

    try:
        # Buffer the whole output until we are sure it can be generated
        return list(difffn(opts.copy(git=False), losedata))
    except GitDiffRequired:
        return difffn(opts.copy(git=True), None)
1540 1538
def difflabel(func, *args, **kw):
    '''yields 2-tuples of (output, label) based on the output of func()

    func(*args, **kw) must produce text chunks. Each line is labelled
    after the first matching prefix, newlines are emitted on their own
    with an empty label.
    '''
    # order matters: '---' and '+++' must be tried before '-' and '+'
    labels = (('diff', 'diff.diffline'),
              ('copy', 'diff.extended'),
              ('rename', 'diff.extended'),
              ('old', 'diff.extended'),
              ('new', 'diff.extended'),
              ('deleted', 'diff.extended'),
              ('---', 'diff.file_a'),
              ('+++', 'diff.file_b'),
              ('@@', 'diff.hunk'),
              ('-', 'diff.deleted'),
              ('+', 'diff.inserted'))

    def classify(text):
        for head, label in labels:
            if text.startswith(head):
                return label
        return None

    for chunk in func(*args, **kw):
        first = True
        for line in chunk.split('\n'):
            if first:
                first = False
            else:
                yield ('\n', '')
            body = line
            if line[:1] in ('+', '-'):
                # highlight trailing whitespace, but only in changed lines
                body = line.rstrip()
            label = classify(body)
            if label is None:
                yield (line, '')
            else:
                yield (body, label)
            if body != line:
                yield (line[len(body):], 'diff.trailingwhitespace')
1572 1570
def diffui(*args, **kw):
    '''like diff(), but yields 2-tuples of (output, label) for ui.write()'''
    labelled = difflabel(diff, *args, **kw)
    return labelled
1576 1574
1577 1575
1578 1576 def _addmodehdr(header, omode, nmode):
1579 1577 if omode != nmode:
1580 1578 header.append('old mode %s\n' % omode)
1581 1579 header.append('new mode %s\n' % nmode)
1582 1580
def trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
            copy, getfilectx, opts, losedatafn, prefix):
    '''yield the diff chunks of modified, added and removed files

    Files are handled in sorted order. For each of them the header
    lines, if any, are yielded as one chunk, followed by the diff
    text. When opts.git is not set, losedatafn is called with the
    file name each time a change cannot be represented.
    '''

    def join(f):
        return os.path.join(prefix, f)

    olddate = util.datestr(ctx1.date())
    oldman = ctx1.manifest()

    gone = set()
    gitmode = {'l': '120000', 'x': '100755', '': '100644'}

    copyto = dict((v, k) for k, v in copy.items())

    if opts.git:
        revs = None

    for f in sorted(modified + added + removed):
        olddata = newdata = None
        dodiff = True
        hdr = []
        if f in oldman:
            olddata = getfilectx(f, ctx1).data()
        if f not in removed:
            newdata = getfilectx(f, ctx2).data()
        src = dst = f
        if opts.git or losedatafn:
            if f in added:
                mode = gitmode[ctx2.flags(f)]
                copied = f in copy or f in copyto
                if copied and opts.git:
                    if f in copy:
                        src = copy[f]
                    else:
                        src = copyto[f]
                    omode = gitmode[oldman.flags(src)]
                    _addmodehdr(hdr, omode, mode)
                    if src in removed and src not in gone:
                        op = 'rename'
                        gone.add(src)
                    else:
                        op = 'copy'
                    hdr.append('%s from %s\n' % (op, join(src)))
                    hdr.append('%s to %s\n' % (op, join(f)))
                    olddata = getfilectx(src, ctx1).data()
                elif copied:
                    losedatafn(f)
                elif opts.git:
                    hdr.append('new file mode %s\n' % mode)
                elif ctx2.flags(f):
                    losedatafn(f)
                # In theory, if newdata was copied or renamed we should
                # check if the source is binary too but the copy record
                # already forces git mode.
                if util.binary(newdata):
                    if opts.git:
                        dodiff = 'binary'
                    else:
                        losedatafn(f)
                if not opts.git and not newdata:
                    # regular diffs cannot represent new empty file
                    losedatafn(f)
            elif f in removed:
                if opts.git:
                    # have we already reported a copy above?
                    reported = ((f in copy and copy[f] in added
                                 and copyto[copy[f]] == f) or
                                (f in copyto and copyto[f] in added
                                 and copy[copyto[f]] == f))
                    if reported:
                        dodiff = False
                    else:
                        hdr.append('deleted file mode %s\n' %
                                   gitmode[oldman.flags(f)])
                elif not olddata or util.binary(olddata):
                    # regular diffs cannot represent empty file deletion
                    losedatafn(f)
            else:
                oflag = oldman.flags(f)
                nflag = ctx2.flags(f)
                binary = util.binary(olddata) or util.binary(newdata)
                if opts.git:
                    _addmodehdr(hdr, gitmode[oflag], gitmode[nflag])
                    if binary:
                        dodiff = 'binary'
                elif binary or nflag != oflag:
                    losedatafn(f)
            if opts.git:
                hdr.insert(0, mdiff.diffline(revs, join(src), join(dst), opts))

        if not dodiff:
            continue
        if dodiff == 'binary':
            text = b85diff(olddata, newdata)
        else:
            text = mdiff.unidiff(olddata, olddate,
                                 # ctx2 date may be dynamic
                                 newdata, util.datestr(ctx2.date()),
                                 join(src), join(dst), revs, opts=opts)
        if hdr and (text or len(hdr) > 1):
            yield ''.join(hdr)
        if text:
            yield text
1686 1684
def diffstatdata(lines):
    '''yield (filename, adds, removes, isbinary) for each file in a diff

    A file starts at a "diff" line. Lines starting with a single '+'
    or '-' marker are counted, "+++" and "---" lines are not. A file
    without any counted line is reported as binary.
    '''
    diffre = re.compile(r'^diff .*-r [a-z0-9]+\s(.*)$')

    filename = None
    adds = removes = 0
    for line in lines:
        if line.startswith('diff'):
            if filename:
                yield (filename, adds, removes, not (adds or removes))
            # set numbers to 0 anyway when starting new file
            adds = removes = 0
            if line.startswith('diff --git'):
                filename = gitre.search(line).group(1)
            elif line.startswith('diff -r'):
                # format: "diff -r ... -r ... filename"
                filename = diffre.search(line).group(1)
        elif line[:1] == '+' and line[:3] != '+++':
            adds += 1
        elif line[:1] == '-' and line[:3] != '---':
            removes += 1
    if filename:
        yield (filename, adds, removes, not (adds or removes))
1710 1708
def diffstat(lines, width=80, git=False):
    '''return a diffstat summary of the diff in lines as a string

    One line is produced per file, with a histogram scaled to fit in
    width columns, followed by a line of totals. With git set, binary
    files show 'Bin' instead of a count.
    '''
    stats = list(diffstatdata(lines))

    sized = [(filename, adds, removes, isbinary, encoding.colwidth(filename))
             for filename, adds, removes, isbinary in stats]

    maxtotal = maxname = 0
    totaladds = totalremoves = 0
    hasbinary = False
    for filename, adds, removes, isbinary, namewidth in sized:
        totaladds += adds
        totalremoves += removes
        maxname = max(maxname, namewidth)
        maxtotal = max(maxtotal, adds + removes)
        if isbinary:
            hasbinary = True

    countwidth = len(str(maxtotal))
    if hasbinary:
        # leave room for 'Bin'
        countwidth = max(countwidth, 3)
    graphwidth = max(width - countwidth - maxname - 6, 10)

    def scale(i):
        if maxtotal <= graphwidth:
            return i
        # If diffstat runs out of room it doesn't print anything,
        # which isn't very useful, so always print at least one + or -
        # if there were at least some changes.
        return max(i * graphwidth // maxtotal, int(bool(i)))

    output = []
    for filename, adds, removes, isbinary, namewidth in sized:
        count = adds + removes
        if git and isbinary:
            count = 'Bin'
        padding = ' ' * (maxname - namewidth)
        graph = '+' * scale(adds) + '-' * scale(removes)
        output.append(' %s%s | %*s %s%s\n' %
                      (filename, padding, countwidth, count, graph, ''))

    if stats:
        output.append(_(' %d files changed, %d insertions(+), %d deletions(-)\n')
                      % (len(stats), totaladds, totalremoves))

    return ''.join(output)
1762 1760
def diffstatui(*args, **kw):
    '''like diffstat(), but yields 2-tuples of (output, label) for
    ui.write()

    The histogram of a line is split in its '+' and '-' runs, every
    other piece of text gets an empty label.
    '''
    graphparts = ((r'\++', 'diffstat.inserted'),
                  (r'-+', 'diffstat.deleted'))

    for line in diffstat(*args, **kw).splitlines():
        if line[-1:] in ('+', '-'):
            name, graph = line.rsplit(' ', 1)
            yield (name + ' ', '')
            for pattern, label in graphparts:
                m = re.search(pattern, graph)
                if m:
                    yield (m.group(0), label)
        else:
            yield (line, '')
        yield ('\n', '')
General Comments 0
You need to be logged in to leave comments. Login now