##// END OF EJS Templates
patch: construct and parse binary hunks at the same time
Patrick Mezard -
r14384:9d59c596 default
parent child Browse files
Show More
@@ -1,1778 +1,1778 b''
1 1 # patch.py - patch file parsing routines
2 2 #
3 3 # Copyright 2006 Brendan Cully <brendan@kublai.com>
4 4 # Copyright 2007 Chris Mason <chris.mason@oracle.com>
5 5 #
6 6 # This software may be used and distributed according to the terms of the
7 7 # GNU General Public License version 2 or any later version.
8 8
9 9 import cStringIO, email.Parser, os, errno, re
10 10 import tempfile, zlib
11 11
12 12 from i18n import _
13 13 from node import hex, nullid, short
14 14 import base85, mdiff, scmutil, util, diffhelpers, copies, encoding
15 15
# Matches the "diff --git a/<old> b/<new>" line that starts a git-style file
# diff; group 1 is the text after "a/", group 2 the text after "b/".
gitre = re.compile('diff --git a/(.*) b/(.*)')
17 17
class PatchError(Exception):
    """Error raised by the patch parsing and application routines."""
20 20
21 21
22 22 # public functions
23 23
def split(stream):
    '''return an iterator of individual patches from a stream

    The stream is read line by line until its format can be guessed from
    the lines seen so far; one of the nested generators below is then
    returned to yield each patch as a cStringIO file object.

    stream must be iterable or, failing that, provide readline().
    '''
    def isheader(line, inheader):
        # True if line looks like an RFC 822 style "Name: value" header,
        # or a continuation of one when we are already in a header block.
        if inheader and line[0] in (' ', '\t'):
            # continuation
            return True
        if line[0] in (' ', '-', '+'):
            # diff line - don't check for header pattern in there
            return False
        l = line.split(': ', 1)
        return len(l) == 2 and ' ' not in l[0]

    def chunk(lines):
        # wrap the accumulated lines in a file-like object
        return cStringIO.StringIO(''.join(lines))

    def hgsplit(stream, cur):
        # split on '# HG changeset patch' markers; a marker only starts a
        # new patch once a blank line has ended the previous header block
        inheader = True

        for line in stream:
            if not line.strip():
                inheader = False
            if not inheader and line.startswith('# HG changeset patch'):
                yield chunk(cur)
                cur = []
                inheader = True

            cur.append(line)

        if cur:
            yield chunk(cur)

    def mboxsplit(stream, cur):
        # split on mbox 'From ' separator lines; each message, minus its
        # separator line (cur[1:]), is fed back through split()
        for line in stream:
            if line.startswith('From '):
                for c in split(chunk(cur[1:])):
                    yield c
                cur = []

            cur.append(line)

        if cur:
            for c in split(chunk(cur[1:])):
                yield c

    def mimesplit(stream, cur):
        # read the whole stream, parse it as an email message and yield
        # either the message itself or each of its textual parts
        def msgfp(m):
            # flatten a message (or message part) into a rewound buffer
            fp = cStringIO.StringIO()
            g = email.Generator.Generator(fp, mangle_from_=False)
            g.flatten(m)
            fp.seek(0)
            return fp

        for line in stream:
            cur.append(line)
        c = chunk(cur)

        m = email.Parser.Parser().parse(c)
        if not m.is_multipart():
            yield msgfp(m)
        else:
            ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
            for part in m.walk():
                ct = part.get_content_type()
                if ct not in ok_types:
                    continue
                yield msgfp(part)

    def headersplit(stream, cur):
        # split each time a new block of header lines starts
        inheader = False

        for line in stream:
            if not inheader and isheader(line, inheader):
                yield chunk(cur)
                cur = []
                inheader = True
            if inheader and not isheader(line, inheader):
                inheader = False

            cur.append(line)

        if cur:
            yield chunk(cur)

    def remainder(cur):
        # the whole input is a single patch
        yield chunk(cur)

    class fiter(object):
        # adapt an object that only offers readline() to the iterator
        # protocol
        def __init__(self, fp):
            self.fp = fp

        def __iter__(self):
            return self

        def next(self):
            l = self.fp.readline()
            if not l:
                raise StopIteration
            return l

    inheader = False
    cur = []

    mimeheaders = ['content-type']

    if not hasattr(stream, 'next'):
        # http responses, for example, have readline but not next
        stream = fiter(stream)

    # Sniff the format.  The chosen splitter receives the lines consumed
    # so far (cur) and continues reading from the same stream.
    for line in stream:
        cur.append(line)
        if line.startswith('# HG changeset patch'):
            return hgsplit(stream, cur)
        elif line.startswith('From '):
            return mboxsplit(stream, cur)
        elif isheader(line, inheader):
            inheader = True
            if line.split(':', 1)[0].lower() in mimeheaders:
                # let email parser handle this
                return mimesplit(stream, cur)
        elif line.startswith('--- ') and inheader:
            # No evil headers seen by diff start, split by hand
            return headersplit(stream, cur)
        # Not enough info, keep reading

    # if we are here, we have a very plain patch
    return remainder(cur)
150 150
def extract(ui, fileobj):
    '''extract patch from data read from fileobj.

    patch can be a normal patch or contained in an email message.

    return tuple (filename, message, user, date, branch, node, p1, p2).
    Any item in the returned tuple can be None. If filename is None,
    fileobj did not contain a patch. Caller must unlink filename when done.

    The patch data is copied to a temporary file (prefix 'hg-patch-');
    that file is removed here when no diff is found or when an error
    occurs while parsing.'''

    # attempt to detect the start of a patch
    # (this heuristic is borrowed from quilt)
    diffre = re.compile(r'^(?:Index:[ \t]|diff[ \t]|RCS file: |'
                        r'retrieving revision [0-9]+(\.[0-9]+)*$|'
                        r'---[ \t].*?^\+\+\+[ \t]|'
                        r'\*\*\*[ \t].*?^---[ \t])', re.MULTILINE|re.DOTALL)

    fd, tmpname = tempfile.mkstemp(prefix='hg-patch-')
    tmpfp = os.fdopen(fd, 'w')
    try:
        msg = email.Parser.Parser().parse(fileobj)

        subject = msg['Subject']
        user = msg['From']
        if not subject and not user:
            # Not an email, restore parsed headers if any
            subject = '\n'.join(': '.join(h) for h in msg.items()) + '\n'

        gitsendmail = 'git-send-email' in msg.get('X-Mailer', '')
        # should try to parse msg['Date']
        date = None
        nodeid = None
        branch = None
        parents = []

        if subject:
            if subject.startswith('[PATCH'):
                # drop the "[PATCH ...]" prefix
                pend = subject.find(']')
                if pend >= 0:
                    subject = subject[pend + 1:].lstrip()
            # unfold continuation lines
            subject = subject.replace('\n\t', ' ')
            ui.debug('Subject: %s\n' % subject)
        if user:
            ui.debug('From: %s\n' % user)
        diffs_seen = 0
        ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
        message = ''
        for part in msg.walk():
            content_type = part.get_content_type()
            ui.debug('Content-Type: %s\n' % content_type)
            if content_type not in ok_types:
                continue
            payload = part.get_payload(decode=True)
            m = diffre.search(payload)
            if m:
                hgpatch = False
                hgpatchheader = False
                ignoretext = False

                ui.debug('found patch at byte %d\n' % m.start(0))
                diffs_seen += 1
                cfp = cStringIO.StringIO()
                # everything before the diff is commit message and/or
                # "hg export" metadata
                for line in payload[:m.start(0)].splitlines():
                    if line.startswith('# HG changeset patch') and not hgpatch:
                        ui.debug('patch generated by hg export\n')
                        hgpatch = True
                        hgpatchheader = True
                        # drop earlier commit message content
                        cfp.seek(0)
                        cfp.truncate()
                        subject = None
                    elif hgpatchheader:
                        if line.startswith('# User '):
                            user = line[7:]
                            ui.debug('From: %s\n' % user)
                        elif line.startswith("# Date "):
                            date = line[7:]
                        elif line.startswith("# Branch "):
                            branch = line[9:]
                        elif line.startswith("# Node ID "):
                            nodeid = line[10:]
                        elif line.startswith("# Parent "):
                            # The matched prefix is 9 characters long.
                            # Strip the remaining padding instead of
                            # slicing at a fixed offset of 10, which cut
                            # the first character of the node when the
                            # header used a single space.
                            parents.append(line[9:].lstrip())
                        elif not line.startswith("# "):
                            hgpatchheader = False
                    elif line == '---' and gitsendmail:
                        # text after '---' in a git-send-email message
                        # is not part of the commit message
                        ignoretext = True
                    if not hgpatchheader and not ignoretext:
                        cfp.write(line)
                        cfp.write('\n')
                message = cfp.getvalue()
                if tmpfp:
                    tmpfp.write(payload)
                    if not payload.endswith('\n'):
                        tmpfp.write('\n')
            elif not diffs_seen and message and content_type == 'text/plain':
                message += '\n' + payload
    except:
        # deliberately broad: clean up the temporary file whatever went
        # wrong, then propagate the original exception
        tmpfp.close()
        os.unlink(tmpname)
        raise

    if subject and not message.startswith(subject):
        message = '%s\n%s' % (subject, message)
    tmpfp.close()
    if not diffs_seen:
        os.unlink(tmpname)
        return None, message, user, date, branch, None, None, None
    p1 = parents and parents.pop(0) or None
    p2 = parents and parents.pop(0) or None
    return tmpname, message, user, date, branch, nodeid, p1, p2
261 261
class patchmeta(object):
    """Metadata describing one file touched by a git-style patch.

    'op' names the operation: ADD, DELETE, RENAME, MODIFY or COPY.
    'path' is the path of the patched file and 'oldpath' the origin
    file for COPY and RENAME (None for the other operations). 'mode'
    stays None unless the file mode changes, in which case it is an
    (islink, isexec) pair telling whether the file is a symlink and
    whether it is executable. 'binary' is False until set by the parser.
    """
    def __init__(self, path):
        self.op = 'MODIFY'
        self.path = path
        self.oldpath = None
        self.mode = None
        self.binary = False

    def setmode(self, mode):
        # 0x2000 is octal 020000 and 0x40 is octal 0100; the masked
        # values themselves (not booleans) are stored.
        self.mode = (mode & 0x2000, mode & 0x40)

    def __repr__(self):
        return "<patchmeta %s %r>" % (self.op, self.path)
286 286
def readgitpatch(lr):
    """Collect git extended-header metadata from the patch lines in lr.

    lr is an iterable of lines. A patchmeta is started at every
    'diff --git' line that matches gitre and is updated from the
    extended header lines that follow, until a '--- ' line or the next
    'diff --git' line closes it. The list of patchmeta objects is
    returned in the order they were found.
    """
    metas = []
    current = None
    for raw in lr:
        line = raw.rstrip(' \r\n')
        if line.startswith('diff --git'):
            found = gitre.match(line)
            if found:
                if current is not None:
                    metas.append(current)
                current = patchmeta(found.group(2))
            continue
        if current is None:
            # not inside a git header, nothing to record
            continue
        if line.startswith('--- '):
            # start of the actual diff, the header is over
            metas.append(current)
            current = None
        elif line.startswith('rename from '):
            current.op = 'RENAME'
            current.oldpath = line[12:]
        elif line.startswith('rename to '):
            current.path = line[10:]
        elif line.startswith('copy from '):
            current.op = 'COPY'
            current.oldpath = line[10:]
        elif line.startswith('copy to '):
            current.path = line[8:]
        elif line.startswith('deleted file'):
            current.op = 'DELETE'
        elif line.startswith('new file mode '):
            current.op = 'ADD'
            current.setmode(int(line[-6:], 8))
        elif line.startswith('new mode '):
            current.setmode(int(line[-6:], 8))
        elif line.startswith('GIT binary patch'):
            current.binary = True
    if current is not None:
        metas.append(current)

    return metas
330 330
class linereader(object):
    """Line-oriented reader with push-back.

    Wraps an object providing readline(). Lines handed to push() are
    returned, oldest first, before anything more is read from fp. The
    first line ending seen on data read from fp is remembered in 'eol',
    and in text mode a trailing CRLF is converted to LF.
    """
    def __init__(self, fp, textmode=False):
        self.fp = fp
        self.textmode = textmode
        self.eol = None
        self.buf = []

    def push(self, line):
        # None is silently ignored
        if line is None:
            return
        self.buf.append(line)

    def readline(self):
        if self.buf:
            # pushed-back lines are returned untouched
            return self.buf.pop(0)
        line = self.fp.readline()
        crlf = line.endswith('\r\n')
        if not self.eol:
            if crlf:
                self.eol = '\r\n'
            elif line.endswith('\n'):
                self.eol = '\n'
        if crlf and self.textmode:
            line = line[:-2] + '\n'
        return line

    def __iter__(self):
        # stop at the first empty read
        while True:
            line = self.readline()
            if not line:
                return
            yield line
364 364
class abstractbackend(object):
    """Interface of the storage layer patches are applied to.

    Every operation except writerej() raises NotImplementedError here
    and has to be provided by subclasses.
    """
    def __init__(self, ui):
        self.ui = ui

    def readlines(self, fname):
        """Return the lines of target file fname. For a symlink, return
        its content as a single line.
        """
        raise NotImplementedError

    def writelines(self, fname, lines, mode):
        """Write lines to target file fname. mode is an (islink, isexec)
        tuple, or None when no mode information is available.
        """
        raise NotImplementedError

    def unlink(self, fname):
        """Remove target file fname."""
        raise NotImplementedError

    def writerej(self, fname, failed, total, lines):
        """Record the rejected lines for fname. failed is the number of
        hunks which failed to apply and total the total number of hunks
        for this file. Does nothing by default.
        """

    def copy(self, src, dst):
        """Copy file src to dst, creating intermediate directories when
        needed. Both paths are relative to the patching base directory.
        """
        raise NotImplementedError

    def exists(self, fname):
        """Tell whether target file fname exists."""
        raise NotImplementedError

    def setmode(self, fname, islink, isexec):
        """Change the mode of target file fname."""
        raise NotImplementedError
405 405
406 406 class fsbackend(abstractbackend):
407 407 def __init__(self, ui, basedir):
408 408 super(fsbackend, self).__init__(ui)
409 409 self.opener = scmutil.opener(basedir)
410 410
411 411 def _join(self, f):
412 412 return os.path.join(self.opener.base, f)
413 413
414 414 def readlines(self, fname):
415 415 if os.path.islink(self._join(fname)):
416 416 return [os.readlink(self._join(fname))]
417 417 fp = self.opener(fname, 'r')
418 418 try:
419 419 return list(fp)
420 420 finally:
421 421 fp.close()
422 422
423 423 def writelines(self, fname, lines, mode):
424 424 if not mode:
425 425 # Preserve mode information
426 426 isexec, islink = False, False
427 427 try:
428 428 isexec = os.lstat(self._join(fname)).st_mode & 0100 != 0
429 429 islink = os.path.islink(self._join(fname))
430 430 except OSError, e:
431 431 if e.errno != errno.ENOENT:
432 432 raise
433 433 else:
434 434 islink, isexec = mode
435 435 if islink:
436 436 self.opener.symlink(''.join(lines), fname)
437 437 else:
438 438 self.opener(fname, 'w').writelines(lines)
439 439 if isexec:
440 440 util.setflags(self._join(fname), False, True)
441 441
442 442 def unlink(self, fname):
443 443 try:
444 444 util.unlinkpath(self._join(fname))
445 445 except OSError, inst:
446 446 if inst.errno != errno.ENOENT:
447 447 raise
448 448
449 449 def writerej(self, fname, failed, total, lines):
450 450 fname = fname + ".rej"
451 451 self.ui.warn(
452 452 _("%d out of %d hunks FAILED -- saving rejects to file %s\n") %
453 453 (failed, total, fname))
454 454 fp = self.opener(fname, 'w')
455 455 fp.writelines(lines)
456 456 fp.close()
457 457
458 458 def copy(self, src, dst):
459 459 basedir = self.opener.base
460 460 abssrc, absdst = [scmutil.canonpath(basedir, basedir, x)
461 461 for x in [src, dst]]
462 462 if os.path.lexists(absdst):
463 463 raise util.Abort(_("cannot create %s: destination already exists")
464 464 % dst)
465 465 dstdir = os.path.dirname(absdst)
466 466 if dstdir and not os.path.isdir(dstdir):
467 467 try:
468 468 os.makedirs(dstdir)
469 469 except IOError:
470 470 raise util.Abort(
471 471 _("cannot create %s: unable to create destination directory")
472 472 % dst)
473 473 util.copyfile(abssrc, absdst)
474 474
475 475 def exists(self, fname):
476 476 return os.path.lexists(self._join(fname))
477 477
478 478 def setmode(self, fname, islink, isexec):
479 479 util.setflags(self._join(fname), islink, isexec)
480 480
class workingbackend(fsbackend):
    """fsbackend rooted at a repository, tracking what the patch touched.

    Written, removed and copied files are recorded as they happen so
    that close() can update the working context and report the changed
    files.
    """
    def __init__(self, ui, repo, similarity):
        super(workingbackend, self).__init__(ui, repo.root)
        self.repo = repo
        self.similarity = similarity
        self.changed = set()
        self.removed = set()
        self.copied = []

    def writelines(self, fname, lines, mode):
        super(workingbackend, self).writelines(fname, lines, mode)
        self.changed.add(fname)

    def unlink(self, fname):
        super(workingbackend, self).unlink(fname)
        for touched in (self.removed, self.changed):
            touched.add(fname)

    def copy(self, src, dst):
        super(workingbackend, self).copy(src, dst)
        self.copied.append((src, dst))
        self.changed.add(dst)

    def setmode(self, fname, islink, isexec):
        super(workingbackend, self).setmode(fname, islink, isexec)
        self.changed.add(fname)

    def close(self):
        """Record copies, removals and additions, then return the sorted
        list of changed files.
        """
        workingctx = self.repo[None]
        pending = set(self.changed)
        for source, dest in self.copied:
            scmutil.dirstatecopy(self.ui, self.repo, workingctx, source, dest)
            # copy sources are left out of the addremove pass
            pending.discard(source)
        if self.removed and not self.similarity:
            workingctx.remove(sorted(self.removed))
        if pending:
            cwd = self.repo.getcwd()
            if cwd:
                root = self.repo.root
                pending = [util.pathto(root, cwd, name) for name in pending]
            scmutil.addremove(self.repo, pending, similarity=self.similarity)
        return sorted(self.changed)
523 523
# unified hunk header:
# @@ -start,len +start,len @@ or @@ -start +start @@ if len is 1
# groups 1/3 are the old start/length, groups 4/6 the new start/length
unidesc = re.compile('@@ -(\d+)(,(\d+))? \+(\d+)(,(\d+))? @@')
# context hunk range line: "*** start,end ***" or "--- start,end ---";
# group 2 is the start and group 4 the optional end
contextdesc = re.compile('(---|\*\*\*) (\d+)(,(\d+))? (---|\*\*\*)')
# names of the supported end-of-line handling modes
eolmodes = ['strict', 'crlf', 'lf', 'auto']
528 528
class patchfile(object):
    """State of one target file while hunks are applied to it.

    The file content is read through the backend at construction time,
    hunks are applied in memory by apply(), and close() writes the
    result and the rejects back through the backend.
    """
    def __init__(self, ui, fname, backend, mode, missing=False,
                 eolmode='strict'):
        self.fname = fname
        self.eolmode = eolmode
        # line ending of the first line of the target file, if any
        self.eol = None
        self.backend = backend
        self.ui = ui
        self.lines = []
        self.exists = False
        self.missing = missing
        self.mode = mode
        if not missing:
            try:
                self.lines = self.backend.readlines(fname)
                if self.lines:
                    # Normalize line endings
                    if self.lines[0].endswith('\r\n'):
                        self.eol = '\r\n'
                    elif self.lines[0].endswith('\n'):
                        self.eol = '\n'
                    if eolmode != 'strict':
                        nlines = []
                        for l in self.lines:
                            if l.endswith('\r\n'):
                                l = l[:-2] + '\n'
                            nlines.append(l)
                        self.lines = nlines
                self.exists = True
            except IOError:
                # an unreadable file is treated as not existing
                pass
        else:
            self.ui.warn(_("unable to find '%s' for patching\n") % self.fname)

        # line content -> list of line indexes, rebuilt by apply()
        self.hash = {}
        self.dirty = 0
        # cumulative line count change caused by the hunks applied so far
        self.offset = 0
        # distance between expected and actual position of the last hunk
        # which needed an offset search
        self.skew = 0
        # hunks which could not be applied
        self.rej = []
        self.fileprinted = False
        self.printfile(False)
        # number of hunks passed to apply()
        self.hunks = 0

    def writelines(self, fname, lines, mode):
        """Write lines through the backend, converting line endings
        according to eolmode first.
        """
        if self.eolmode == 'auto':
            eol = self.eol
        elif self.eolmode == 'crlf':
            eol = '\r\n'
        else:
            eol = '\n'

        # lines are kept LF-terminated in memory unless eolmode is
        # 'strict'; convert them back when the target ending differs
        if self.eolmode != 'strict' and eol and eol != '\n':
            rawlines = []
            for l in lines:
                if l and l[-1] == '\n':
                    l = l[:-1] + eol
                rawlines.append(l)
            lines = rawlines

        self.backend.writelines(fname, lines, mode)

    def printfile(self, warn):
        """Report the name of the file being patched, as a warning when
        warn is set and as a note otherwise.
        """
        if self.fileprinted:
            return
        if warn or self.ui.verbose:
            self.fileprinted = True
        s = _("patching file %s\n") % self.fname
        if warn:
            self.ui.warn(s)
        else:
            self.ui.note(s)


    def findlines(self, l, linenum):
        # looks through the hash and finds candidate lines. The
        # result is a list of line numbers sorted based on distance
        # from linenum

        cand = self.hash.get(l, [])
        if len(cand) > 1:
            # resort our list of potentials forward then back.
            cand.sort(key=lambda x: abs(x - linenum))
        return cand

    def write_rej(self):
        # our rejects are a little different from patch(1). This always
        # creates rejects in the same form as the original patch. A file
        # header is inserted so that you can run the reject through patch again
        # without having to type the filename.
        if not self.rej:
            return
        base = os.path.basename(self.fname)
        lines = ["--- %s\n+++ %s\n" % (base, base)]
        for x in self.rej:
            for l in x.hunk:
                lines.append(l)
                # a hunk line without trailing newline gets the marker
                if l[-1] != '\n':
                    lines.append("\n\ No newline at end of file\n")
        self.backend.writerej(self.fname, len(self.rej), self.hunks, lines)

    def apply(self, h):
        """Apply hunk h to the in-memory lines.

        Returns 0 when the hunk applied at the expected position (or is
        a binary hunk), the fuzz level used when it applied after an
        offset/fuzz search, and -1 when it was rejected. Raises
        PatchError if the hunk is incomplete.
        """
        if not h.complete():
            raise PatchError(_("bad hunk #%d %s (%d %d %d %d)") %
                            (h.number, h.desc, len(h.a), h.lena, len(h.b),
                            h.lenb))

        self.hunks += 1

        if self.missing:
            self.rej.append(h)
            return -1

        if self.exists and h.createfile():
            self.ui.warn(_("file %s already exists\n") % self.fname)
            self.rej.append(h)
            return -1

        if isinstance(h, binhunk):
            # binary hunks replace the whole content
            if h.rmfile():
                self.backend.unlink(self.fname)
            else:
                self.lines[:] = h.new()
                self.offset += len(h.new())
                self.dirty = True
            return 0

        # keep the unmodified hunk for the reject file
        horig = h
        if (self.eolmode in ('crlf', 'lf')
            or self.eolmode == 'auto' and self.eol):
            # If new eols are going to be normalized, then normalize
            # hunk data before patching. Otherwise, preserve input
            # line-endings.
            h = h.getnormalized()

        # fast case first, no offsets, no fuzz
        old = h.old()
        # patch starts counting at 1 unless we are adding the file
        if h.starta == 0:
            start = 0
        else:
            start = h.starta + self.offset - 1
        orig_start = start
        # if there's skew we want to emit the "(offset %d lines)" even
        # when the hunk cleanly applies at start + skew, so skip the
        # fast case code
        if self.skew == 0 and diffhelpers.testhunk(old, self.lines, start) == 0:
            if h.rmfile():
                self.backend.unlink(self.fname)
            else:
                self.lines[start : start + h.lena] = h.new()
                self.offset += h.lenb - h.lena
                self.dirty = True
            return 0

        # ok, we couldn't match the hunk. Lets look for offsets and fuzz it
        self.hash = {}
        for x, s in enumerate(self.lines):
            self.hash.setdefault(s, []).append(x)
        if h.hunk[-1][0] != ' ':
            # if the hunk tried to put something at the bottom of the file
            # override the start line and use eof here
            search_start = len(self.lines)
        else:
            search_start = orig_start + self.skew

        # try increasing fuzz, trimming context from the top only first
        for fuzzlen in xrange(3):
            for toponly in [True, False]:
                old = h.old(fuzzlen, toponly)

                # look the first old line up without its leading
                # character, closest candidates first
                cand = self.findlines(old[0][1:], search_start)
                for l in cand:
                    if diffhelpers.testhunk(old, self.lines, l) == 0:
                        newlines = h.new(fuzzlen, toponly)
                        self.lines[l : l + len(old)] = newlines
                        self.offset += len(newlines) - len(old)
                        self.skew = l - orig_start
                        self.dirty = True
                        offset = l - orig_start - fuzzlen
                        if fuzzlen:
                            msg = _("Hunk #%d succeeded at %d "
                                    "with fuzz %d "
                                    "(offset %d lines).\n")
                            self.printfile(True)
                            self.ui.warn(msg %
                                (h.number, l + 1, fuzzlen, offset))
                        else:
                            msg = _("Hunk #%d succeeded at %d "
                                    "(offset %d lines).\n")
                            self.ui.note(msg % (h.number, l + 1, offset))
                        return fuzzlen
        self.printfile(True)
        self.ui.warn(_("Hunk #%d FAILED at %d\n") % (h.number, orig_start))
        self.rej.append(horig)
        return -1

    def close(self):
        """Write the patched content if it changed, write the rejects
        and return the number of rejected hunks.
        """
        if self.dirty:
            self.writelines(self.fname, self.lines, self.mode)
        self.write_rej()
        return len(self.rej)
729 729
class hunk(object):
    """One text hunk, parsed from unified or context diff format.

    'hunk' holds the hunk in unified form, starting with its '@@' line.
    'a' and 'b' hold the old and new side, 'starta'/'lena' and
    'startb'/'lenb' the ranges announced by the hunk header.
    """
    def __init__(self, desc, num, lr, context, create=False, remove=False):
        self.number = num
        self.desc = desc
        self.hunk = [desc]
        self.a = []
        self.b = []
        self.starta = self.lena = None
        self.startb = self.lenb = None
        # lr is None when the object is filled in by hand, see
        # getnormalized()
        if lr is not None:
            if context:
                self.read_context_hunk(lr)
            else:
                self.read_unified_hunk(lr)
        self.create = create
        # a hunk cannot both create and remove the file
        self.remove = remove and not create

    def getnormalized(self):
        """Return a copy with line endings normalized to LF."""

        def normalize(lines):
            nlines = []
            for line in lines:
                if line.endswith('\r\n'):
                    line = line[:-2] + '\n'
                nlines.append(line)
            return nlines

        # Dummy object, it is rebuilt manually
        nh = hunk(self.desc, self.number, None, None, False, False)
        nh.number = self.number
        nh.desc = self.desc
        # note: the hunk list itself is shared, not normalized
        nh.hunk = self.hunk
        nh.a = normalize(self.a)
        nh.b = normalize(self.b)
        nh.starta = self.starta
        nh.startb = self.startb
        nh.lena = self.lena
        nh.lenb = self.lenb
        nh.create = self.create
        nh.remove = self.remove
        return nh

    def read_unified_hunk(self, lr):
        """Parse the '@@' header in self.desc and read the hunk body
        from lr. Raises PatchError on a malformed header.
        """
        m = unidesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.starta, foo, self.lena, self.startb, foo2, self.lenb = m.groups()
        # an omitted length means one line
        if self.lena is None:
            self.lena = 1
        else:
            self.lena = int(self.lena)
        if self.lenb is None:
            self.lenb = 1
        else:
            self.lenb = int(self.lenb)
        self.starta = int(self.starta)
        self.startb = int(self.startb)
        diffhelpers.addlines(lr, self.hunk, self.lena, self.lenb, self.a, self.b)
        # if we hit eof before finishing out the hunk, the last line will
        # be zero length. Lets try to fix it up.
        while len(self.hunk[-1]) == 0:
            del self.hunk[-1]
            del self.a[-1]
            del self.b[-1]
            self.lena -= 1
            self.lenb -= 1
        self._fixnewline(lr)

    def read_context_hunk(self, lr):
        """Read a context diff hunk from lr and convert it to unified
        form. Raises PatchError on malformed input.
        """
        # old side: "*** start,end ***" followed by the old lines
        self.desc = lr.readline()
        m = contextdesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        foo, self.starta, foo2, aend, foo3 = m.groups()
        self.starta = int(self.starta)
        if aend is None:
            aend = self.starta
        self.lena = int(aend) - self.starta
        if self.starta:
            self.lena += 1
        for x in xrange(self.lena):
            l = lr.readline()
            if l.startswith('---'):
                # lines addition, old block is empty
                lr.push(l)
                break
            # drop the two character context diff prefix
            s = l[2:]
            if l.startswith('- ') or l.startswith('! '):
                u = '-' + s
            # NOTE(review): this literal may have been two spaces before
            # the listing was extracted - confirm against the repository
            elif l.startswith(' '):
                u = ' ' + s
            else:
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.a.append(u)
            self.hunk.append(u)

        l = lr.readline()
        if l.startswith('\ '):
            # no-eol marker: strip the newline of the last old line
            s = self.a[-1][:-1]
            self.a[-1] = s
            self.hunk[-1] = s
            l = lr.readline()
        # new side: "--- start,end ---" followed by the new lines
        m = contextdesc.match(l)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        foo, self.startb, foo2, bend, foo3 = m.groups()
        self.startb = int(self.startb)
        if bend is None:
            bend = self.startb
        self.lenb = int(bend) - self.startb
        if self.startb:
            self.lenb += 1
        # index in self.hunk where the next new line is merged
        hunki = 1
        for x in xrange(self.lenb):
            l = lr.readline()
            if l.startswith('\ '):
                # XXX: the only way to hit this is with an invalid line range.
                # The no-eol marker is not counted in the line range, but I
                # guess there are diff(1) out there which behave differently.
                s = self.b[-1][:-1]
                self.b[-1] = s
                self.hunk[hunki - 1] = s
                continue
            if not l:
                # line deletions, new block is empty and we hit EOF
                lr.push(l)
                break
            s = l[2:]
            if l.startswith('+ ') or l.startswith('! '):
                u = '+' + s
            # NOTE(review): same possible whitespace collapse as in the
            # old-side loop above - confirm
            elif l.startswith(' '):
                u = ' ' + s
            elif len(self.b) == 0:
                # line deletions, new block is empty
                lr.push(l)
                break
            else:
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.b.append(s)
            # merge u into the unified hunk: skip the '-' lines, stop on
            # an identical line, insert before anything else
            while True:
                if hunki >= len(self.hunk):
                    h = ""
                else:
                    h = self.hunk[hunki]
                hunki += 1
                if h == u:
                    break
                elif h.startswith('-'):
                    continue
                else:
                    self.hunk.insert(hunki - 1, u)
                    break

        if not self.a:
            # this happens when lines were only added to the hunk
            for x in self.hunk:
                if x.startswith('-') or x.startswith(' '):
                    self.a.append(x)
        if not self.b:
            # this happens when lines were only deleted from the hunk
            for x in self.hunk:
                if x.startswith('+') or x.startswith(' '):
                    self.b.append(x[1:])
        # @@ -start,len +start,len @@
        self.desc = "@@ -%d,%d +%d,%d @@\n" % (self.starta, self.lena,
                                             self.startb, self.lenb)
        self.hunk[0] = self.desc
        self._fixnewline(lr)

    def _fixnewline(self, lr):
        # consume a following no-eol marker line and let diffhelpers
        # adjust the hunk; any other line is pushed back
        l = lr.readline()
        if l.startswith('\ '):
            diffhelpers.fix_newline(self.hunk, self.a, self.b)
        else:
            lr.push(l)

    def complete(self):
        """True when both sides have the announced number of lines."""
        return len(self.a) == self.lena and len(self.b) == self.lenb

    def createfile(self):
        """True when the hunk creates the file: empty old range and the
        create flag set.
        """
        return self.starta == 0 and self.lena == 0 and self.create

    def rmfile(self):
        """True when the hunk removes the file: empty new range and the
        remove flag set.
        """
        return self.startb == 0 and self.lenb == 0 and self.remove

    def fuzzit(self, l, fuzz, toponly):
        # this removes context lines from the top and bottom of list 'l'. It
        # checks the hunk to make sure only context lines are removed, and then
        # returns a new shortened list of lines.
        fuzz = min(fuzz, len(l)-1)
        if fuzz:
            top = 0
            bot = 0
            hlen = len(self.hunk)
            # count leading context lines
            for x in xrange(hlen - 1):
                # the hunk starts with the @@ line, so use x+1
                if self.hunk[x + 1][0] == ' ':
                    top += 1
                else:
                    break
            if not toponly:
                # count trailing context lines
                for x in xrange(hlen - 1):
                    if self.hunk[hlen - bot - 1][0] == ' ':
                        bot += 1
                    else:
                        break

            # top and bot now count context in the hunk
            # adjust them if either one is short
            context = max(top, bot, 3)
            if bot < context:
                bot = max(0, fuzz - (context - bot))
            else:
                bot = min(fuzz, bot)
            if top < context:
                top = max(0, fuzz - (context - top))
            else:
                top = min(fuzz, top)

            return l[top:len(l)-bot]
        return l

    def old(self, fuzz=0, toponly=False):
        """Return the old side, with context trimmed by fuzzit()."""
        return self.fuzzit(self.a, fuzz, toponly)

    def new(self, fuzz=0, toponly=False):
        """Return the new side, with context trimmed by fuzzit()."""
        return self.fuzzit(self.b, fuzz, toponly)
960 960
class binhunk:
    'A binary patch file. Only understands literals so far.'
    def __init__(self, gitpatch, lr):
        """Parse a git binary hunk for gitpatch from line reader lr.

        Raises PatchError when no 'literal' section is found or when
        the decoded data does not have the announced size.
        """
        self.gitpatch = gitpatch
        # decoded file content, set by _read()
        self.text = None
        # raw hunk lines, kept so the hunk can be written to a reject
        self.hunk = ['GIT binary patch\n']
        self._read(lr)

    def createfile(self):
        return self.gitpatch.op == 'ADD'

    def rmfile(self):
        return self.gitpatch.op == 'DELETE'

    def complete(self):
        return self.text is not None

    def new(self):
        # the whole content is handled as a single "line"
        return [self.text]

    def _read(self, lr):
        # skip everything up to the "literal <size>" line
        line = lr.readline()
        self.hunk.append(line)
        while line and not line.startswith('literal '):
            line = lr.readline()
            self.hunk.append(line)
        if not line:
            raise PatchError(_('could not extract binary patch'))
        size = int(line[8:].rstrip())
        dec = []
        line = lr.readline()
        self.hunk.append(line)
        # data lines run until a line of at most one character
        while len(line) > 1:
            # the first character encodes the decoded length of the
            # line: 'A'-'Z' map to 1-26, anything else is taken
            # relative to 'a' starting at 27
            l = line[0]
            if l <= 'Z' and l >= 'A':
                l = ord(l) - ord('A') + 1
            else:
                l = ord(l) - ord('a') + 27
            dec.append(base85.b85decode(line[1:-1])[:l])
            line = lr.readline()
            self.hunk.append(line)
        text = zlib.decompress(''.join(dec))
        if len(text) != size:
            # both values must be passed to % as one tuple; without
            # the parentheses formatting itself raised a TypeError
            raise PatchError(_('binary patch is %d bytes, not %d') %
                             (len(text), size))
        self.text = text
1006 1007
def parsefilename(str):
    """Extract the file name from a '--- name' or '+++ name' header line.

    The first four characters are dropped, then the name is cut at the
    first tab if there is one, otherwise at the first space.
    """
    # --- filename \t|space stuff
    rest = str[4:].rstrip('\r\n')
    for sep in ('\t', ' '):
        cut = rest.find(sep)
        if cut >= 0:
            return rest[:cut]
    return rest
1016 1017
def pathstrip(path, strip):
    """Split path after its first 'strip' directory components.

    Returns a (stripped prefix, remaining path) pair. Runs of '/' following
    a stripped component are consumed along with it. Raises PatchError when
    path has fewer than 'strip' components.
    """
    if strip == 0:
        return '', path.rstrip()
    last = len(path) - 1
    pos = 0
    for remaining in range(strip, 0, -1):
        pos = path.find('/', pos)
        if pos == -1:
            raise PatchError(_("unable to strip away %d of %d dirs from %s") %
                             (remaining, strip, path))
        pos += 1
        # consume '//' in the path
        while pos < last and path[pos] == '/':
            pos += 1
    return path[:pos].lstrip(), path[pos:].rstrip()
1034 1035
def selectfile(backend, afile_orig, bfile_orig, hunk, strip):
    """Choose which file a patch entry should be applied to.

    afile_orig and bfile_orig are the source and destination names taken
    from the patch, 'strip' is the number of leading path components to
    remove from them, and 'hunk' is the first hunk of the entry.

    Returns a (fname, missing) pair: the selected file name, and whether
    neither candidate exists in the backend while the hunk does not create
    the file. Raises PatchError if both names are /dev/null.

    Note that hunk.create may be assigned as a side effect.
    """
    nulla = afile_orig == "/dev/null"
    nullb = bfile_orig == "/dev/null"
    abase, afile = pathstrip(afile_orig, strip)
    gooda = not nulla and backend.exists(afile)
    bbase, bfile = pathstrip(bfile_orig, strip)
    if afile == bfile:
        # same stripped name: no need to query the backend twice
        goodb = gooda
    else:
        goodb = not nullb and backend.exists(bfile)
    createfunc = hunk.createfile
    missing = not goodb and not gooda and not createfunc()

    # some diff programs apparently produce patches where the afile is
    # not /dev/null, but afile starts with bfile
    abasedir = afile[:afile.rfind('/') + 1]
    bbasedir = bfile[:bfile.rfind('/') + 1]
    if missing and abasedir == bbasedir and afile.startswith(bfile):
        # this isn't very pretty
        # tentatively flag the hunk as a creation and ask it again; the
        # flag is reverted if the hunk still does not report a creation
        hunk.create = True
        if createfunc():
            missing = False
        else:
            hunk.create = False

    # If afile is "a/b/foo" and bfile is "a/b/foo.orig" we assume the
    # diff is between a file and its backup. In this case, the original
    # file should be patched (see original mpatch code).
    isbackup = (abase == bbase and bfile.startswith(afile))
    fname = None
    if not missing:
        # prefer a name that exists in the backend
        if gooda and goodb:
            fname = isbackup and afile or bfile
        elif gooda:
            fname = afile

    if not fname:
        # nothing usable exists: fall back on any name that is not /dev/null
        if not nullb:
            fname = isbackup and afile or bfile
        elif not nulla:
            fname = afile
        else:
            raise PatchError(_("undefined source and destination files"))

    return fname, missing
1080 1081
def scangitpatch(lr, firstline):
    """
    Git patches can emit:
    - rename a to b
    - change b
    - copy a to c
    - change c

    We cannot apply this sequence as-is, the renamed 'a' could not be
    found for it would have been renamed already. And we cannot copy
    from 'b' instead because 'b' would have been changed already. So
    we scan the git patch for copy and rename commands so we can
    perform the copies ahead of time.

    'lr' is the line reader currently parsing the patch and 'firstline'
    the line it just consumed; the line is pushed onto a second reader so
    the scan includes it. Returns whatever readgitpatch() extracts from
    the rest of the input.
    """
    pos = 0
    try:
        # remember the current offset so the stream can be rewound once
        # the scan is over
        pos = lr.fp.tell()
        fp = lr.fp
    except IOError:
        # tell() failed: scan an in-memory copy of the remaining input
        # NOTE(review): lr.fp itself is not replaced here, so after the
        # read() above the caller's reader presumably sees an exhausted
        # stream - confirm against linereader
        fp = cStringIO.StringIO(lr.fp.read())
    gitlr = linereader(fp, lr.textmode)
    gitlr.push(firstline)
    gitpatches = readgitpatch(gitlr)
    # rewind what was scanned
    fp.seek(pos)
    return gitpatches
1106 1107
def iterhunks(fp):
    """Read a patch and yield the following events:
    - ("file", afile, bfile, firsthunk): select a new target file.
    - ("hunk", hunk): a new hunk is ready to be applied, follows a
    "file" event.
    - ("git", gitchanges): current diff is in git format, gitchanges
    maps filenames to gitpatch records. Unique event.

    As written, the "file" payload is an (afile, bfile, firsthunk, mode)
    tuple where mode is the git mode of the target or None, and the "git"
    payload is the value returned by scangitpatch().
    """
    # git metadata indexed by target path, filled by the first git header
    changed = {}
    afile = ""
    bfile = ""
    state = None
    hunknum = 0
    # newfile: a file header was just parsed in this iteration
    # emitfile: a "file" event must precede the next hunk
    emitfile = newfile = False
    git = False

    # our states
    BFILE = 1
    # None: diff format still unknown, True: context diff, False: unified
    context = None
    lr = linereader(fp)

    while True:
        x = lr.readline()
        if not x:
            break
        if state == BFILE and (
            (not context and x[0] == '@')
            or (context is not False and x.startswith('***************'))
            or x.startswith('GIT binary patch')):
            # start of a hunk for the current file
            gp = changed.get(bfile)
            if x.startswith('GIT binary patch'):
                # the binary hunk reads its own payload from lr
                h = binhunk(gp, lr)
                afile = 'a/' + afile
                bfile = 'b/' + bfile
            else:
                if context is None and x.startswith('***************'):
                    context = True
                create = afile == '/dev/null' or gp and gp.op == 'ADD'
                remove = bfile == '/dev/null' or gp and gp.op == 'DELETE'
                h = hunk(x, hunknum + 1, lr, context, create, remove)
            hunknum += 1
            if emitfile:
                emitfile = False
                yield 'file', (afile, bfile, h, gp and gp.mode or None)
            yield 'hunk', h
        elif x.startswith('diff --git'):
            # check for git diff, scanning the whole patch file if needed
            m = gitre.match(x)
            if m:
                afile, bfile = m.group(1, 2)
                if not git:
                    git = True
                    gitpatches = scangitpatch(lr, x)
                    yield 'git', gitpatches
                    for gp in gitpatches:
                        changed[gp.path] = gp
                # else error?
                # copy/rename + modify should modify target, not source
                gp = changed.get(bfile)
                if gp and (gp.op in ('COPY', 'DELETE', 'RENAME', 'ADD')
                           or gp.mode):
                    afile = bfile
                newfile = True
        elif x.startswith('---'):
            # check for a unified diff
            l2 = lr.readline()
            if not l2.startswith('+++'):
                lr.push(l2)
                continue
            newfile = True
            context = False
            afile = parsefilename(x)
            bfile = parsefilename(l2)
        elif x.startswith('***'):
            # check for a context diff
            l2 = lr.readline()
            if not l2.startswith('---'):
                lr.push(l2)
                continue
            # peek at the third line: it is always pushed back
            l3 = lr.readline()
            lr.push(l3)
            if not l3.startswith("***************"):
                lr.push(l2)
                continue
            newfile = True
            context = True
            afile = parsefilename(x)
            bfile = parsefilename(l2)

        if newfile:
            # a header was parsed: hunks are expected next and the first
            # one must be announced by a "file" event
            newfile = False
            emitfile = True
            state = BFILE
            hunknum = 0
1202 1202
def applydiff(ui, fp, changed, backend, strip=1, eolmode='strict'):
    """Read a patch from fp and try to apply it with the patchfile patcher.

    'changed' is a dict which gets filled in with all of the filenames
    changed by the patch. The result is 0 for a clean patch, -1 if any
    rejects were found and 1 if there was any fuzz.

    With 'eolmode' set to 'strict', the patch content and patched file are
    read in binary mode. Otherwise, line endings are ignored when
    patching then normalized according to 'eolmode'.
    """
    options = {'strip': strip, 'eolmode': eolmode}
    return _applydiff(ui, fp, patchfile, backend, changed, **options)
1216 1216
def _applydiff(ui, fp, patcher, backend, changed, strip=1, eolmode='strict'):
    """Apply the patch read from fp, one iterhunks() event at a time.

    'patcher' is called to build the object applying hunks to each
    selected file, 'backend' performs the file operations and 'changed'
    is a dict updated with the touched file names.

    Returns -1 if anything was rejected, otherwise 1 if a hunk applied
    with a positive status, otherwise 0. Raises util.Abort on an unknown
    parser event.
    """
    rejects = 0
    err = 0
    current_file = None

    for state, values in iterhunks(fp):
        if state == 'hunk':
            if not current_file:
                # the file could not be set up, drop its hunks
                continue
            ret = current_file.apply(values)
            if ret >= 0:
                changed.setdefault(current_file.fname, None)
                if ret > 0:
                    err = 1
        elif state == 'file':
            if current_file:
                rejects += current_file.close()
            afile, bfile, first_hunk, mode = values
            try:
                current_file, missing = selectfile(backend, afile, bfile,
                                                   first_hunk, strip)
                current_file = patcher(ui, current_file, backend, mode,
                                       missing=missing, eolmode=eolmode)
            except PatchError, inst:
                # report the failure, count it as a reject and move on
                ui.warn(str(inst) + '\n')
                current_file = None
                rejects += 1
                continue
        elif state == 'git':
            for gp in values:
                gp.path = pathstrip(gp.path, strip - 1)[1]
                if gp.oldpath:
                    gp.oldpath = pathstrip(gp.oldpath, strip - 1)[1]
                if gp.op in ('COPY', 'RENAME'):
                    # copies are performed before any hunk is applied
                    backend.copy(gp.oldpath, gp.path)
                changed[gp.path] = gp
        else:
            raise util.Abort(_('unsupported parser state: %s') % state)

    if current_file:
        rejects += current_file.close()

    # Handle mode changes without hunk
    removed = set()
    for gp in changed.itervalues():
        if not gp:
            # entry recorded from a plain hunk, no git metadata
            continue
        if gp.op == 'DELETE':
            removed.add(gp.path)
            continue
        if gp.op == 'RENAME':
            removed.add(gp.oldpath)
        if gp.mode:
            if gp.op == 'ADD' and not backend.exists(gp.path):
                # Added files without content have no hunk and must be created
                backend.writelines(gp.path, [], gp.mode)
            else:
                backend.setmode(gp.path, gp.mode[0], gp.mode[1])
    for path in sorted(removed):
        backend.unlink(path)

    if rejects:
        return -1
    return err
1281 1281
def _externalpatch(ui, repo, patcher, patchname, strip, files,
                   similarity):
    """use <patcher> to apply <patchname> to the working directory.
    returns whether patch was applied with fuzz factor.

    The patcher output is scanned line by line: patched file names are
    recorded in the 'files' dict, and fuzz, reject and failure messages
    are passed to ui.warn(). Raises PatchError if closing the command
    pipe reports a non-zero status."""

    fuzz = False
    args = []
    cwd = repo.root
    if cwd:
        args.append('-d %s' % util.shellquote(cwd))
    fp = util.popen('%s %s -p%d < %s' % (patcher, ' '.join(args), strip,
                                       util.shellquote(patchname)))
    # No file name is known until a 'patching file' line is seen. Start
    # with printed_file set so that an early fuzz/FAILED message is warned
    # about on its own instead of reading unassigned variables.
    pf = None
    printed_file = True
    try:
        for line in fp:
            line = line.rstrip()
            ui.note(line + '\n')
            if line.startswith('patching file '):
                pf = util.parsepatchoutput(line)
                printed_file = False
                files.setdefault(pf, None)
            elif line.find('with fuzz') >= 0:
                fuzz = True
                if not printed_file:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
            elif line.find('saving rejects to file') >= 0:
                ui.warn(line + '\n')
            elif line.find('FAILED') >= 0:
                if not printed_file:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
    finally:
        if files:
            cfiles = list(files)
            cwd = repo.getcwd()
            if cwd:
                # iterate over cfiles: the former 'cfile' name was never
                # defined and raised NameError
                cfiles = [util.pathto(repo.root, cwd, f)
                          for f in cfiles]
            scmutil.addremove(repo, cfiles, similarity=similarity)
    code = fp.close()
    if code:
        raise PatchError(_("patch command failed: %s") %
                         util.explainexit(code)[0])
    return fuzz
1328 1328
def internalpatch(ui, repo, patchobj, strip, files=None, eolmode='strict',
                  similarity=0):
    """use builtin patch to apply <patchobj> to the working directory.
    returns whether patch was applied with fuzz factor.

    patchobj is first passed to open(); if that raises TypeError it is
    used directly as the input stream. Raises util.Abort on an unknown
    eolmode and PatchError when the patch does not apply."""

    if files is None:
        files = {}
    if eolmode is None:
        eolmode = ui.config('patch', 'eol', 'strict')
    normalized = eolmode.lower()
    if normalized not in eolmodes:
        raise util.Abort(_('unsupported line endings type: %s') % eolmode)
    eolmode = normalized

    backend = workingbackend(ui, repo, similarity)
    try:
        fp = open(patchobj, 'rb')
    except TypeError:
        fp = patchobj
    try:
        ret = applydiff(ui, fp, files, backend, strip=strip, eolmode=eolmode)
    finally:
        # only close what was opened here
        if fp != patchobj:
            fp.close()
        files.update(dict.fromkeys(backend.close()))
    if ret >= 0:
        return ret > 0
    raise PatchError(_('patch failed to apply'))
1356 1356
1357 1357 def patch(ui, repo, patchname, strip=1, files=None, eolmode='strict',
1358 1358 similarity=0):
1359 1359 """Apply <patchname> to the working directory.
1360 1360
1361 1361 'eolmode' specifies how end of lines should be handled. It can be:
1362 1362 - 'strict': inputs are read in binary mode, EOLs are preserved
1363 1363 - 'crlf': EOLs are ignored when patching and reset to CRLF
1364 1364 - 'lf': EOLs are ignored when patching and reset to LF
1365 1365 - None: get it from user settings, default to 'strict'
1366 1366 'eolmode' is ignored when using an external patcher program.
1367 1367
1368 1368 Returns whether patch was applied with fuzz factor.
1369 1369 """
1370 1370 patcher = ui.config('ui', 'patch')
1371 1371 if files is None:
1372 1372 files = {}
1373 1373 try:
1374 1374 if patcher:
1375 1375 return _externalpatch(ui, repo, patcher, patchname, strip,
1376 1376 files, similarity)
1377 1377 return internalpatch(ui, repo, patchname, strip, files, eolmode,
1378 1378 similarity)
1379 1379 except PatchError, err:
1380 1380 raise util.Abort(str(err))
1381 1381
def changedfiles(ui, repo, patchpath, strip=1):
    """Return the set of file names touched by the patch at patchpath.

    The patch is parsed with iterhunks() but nothing is applied. Raises
    util.Abort on an unknown parser event.
    """
    backend = fsbackend(ui, repo.root)
    fp = open(patchpath, 'rb')
    try:
        touched = set()
        for state, values in iterhunks(fp):
            if state == 'file':
                afile, bfile, first_hunk, mode = values
                target, missing = selectfile(backend, afile, bfile,
                                             first_hunk, strip)
                touched.add(target)
            elif state == 'git':
                for gp in values:
                    gp.path = pathstrip(gp.path, strip - 1)[1]
                    touched.add(gp.path)
                    if not gp.oldpath:
                        continue
                    gp.oldpath = pathstrip(gp.oldpath, strip - 1)[1]
                    if gp.op == 'RENAME':
                        touched.add(gp.oldpath)
            elif state != 'hunk':
                raise util.Abort(_('unsupported parser state: %s') % state)
        return touched
    finally:
        fp.close()
1408 1408
def b85diff(to, tn):
    '''return a base85-encoded git binary diff from to to tn

    The result is an empty string when both contents have the same git
    blob id. Otherwise it holds the index line, the 'GIT binary patch'
    and 'literal' headers and the compressed new content, encoded by
    chunks of at most 52 bytes.'''
    def blobid(data):
        # empty or missing content maps to the null id
        if not data:
            return hex(nullid)
        digest = util.sha1('blob %d\0' % len(data))
        digest.update(data)
        return digest.hexdigest()

    def encodeline(piece):
        # the leading character encodes the piece length:
        # 'A'.. for 1 to 26 bytes, 'a'.. above
        size = len(piece)
        if size > 26:
            marker = chr(size - 26 + ord('a') - 1)
        else:
            marker = chr(ord('A') + size - 1)
        return '%c%s\n' % (marker, base85.b85encode(piece, True))

    def pieces(data, csize=52):
        for start in range(0, len(data), csize):
            yield data[start:start + csize]

    oldid = blobid(to)
    newid = blobid(tn)
    if oldid == newid:
        return ""

    # TODO: deltas
    out = ['index %s..%s\nGIT binary patch\nliteral %s\n' %
           (oldid, newid, len(tn))]
    out.extend([encodeline(piece) for piece in pieces(zlib.compress(tn))])
    out.append('\n')
    return ''.join(out)
1446 1446
class GitDiffRequired(Exception):
    """Raised when a change can only be represented by a git-style diff."""
1449 1449
def diffopts(ui, opts=None, untrusted=False):
    """Build an mdiff.diffopts object from 'opts' and the [diff] section.

    A true value found in opts wins; otherwise the setting is read from
    the configuration, honoring 'untrusted'.
    """
    def get(key, name=None, getter=ui.configbool):
        explicit = opts and opts.get(key)
        if explicit:
            return explicit
        return getter('diff', name or key, None, untrusted=untrusted)

    settings = {
        'text': opts and opts.get('text'),
        'git': get('git'),
        'nodates': get('nodates'),
        'showfunc': get('show_function', 'showfunc'),
        'ignorews': get('ignore_all_space', 'ignorews'),
        'ignorewsamount': get('ignore_space_change', 'ignorewsamount'),
        'ignoreblanklines': get('ignore_blank_lines', 'ignoreblanklines'),
        'context': get('unified', getter=ui.config),
    }
    return mdiff.diffopts(**settings)
1463 1463
def diff(repo, node1=None, node2=None, match=None, changes=None, opts=None,
         losedatafn=None, prefix=''):
    '''yields diff of changes to files between two nodes, or node and
    working directory.

    if node1 is None, use first dirstate parent instead.
    if node2 is None, compare node1 with working directory.

    losedatafn(**kwarg) is a callable run when opts.upgrade=True and
    every time some change cannot be represented with the current
    patch format. Return False to upgrade to git patch format, True to
    accept the loss or raise an exception to abort the diff. It is
    called with the name of current file being diffed as 'fn'. If set
    to None, patches will always be upgraded to git format when
    necessary.

    prefix is a filename prefix that is prepended to all filenames on
    display (used for subrepos).

    The result is an iterable of text chunks: an empty list when nothing
    changed, a fully buffered list when opts.upgrade is set without
    opts.git and no upgrade was needed, and the trydiff() generator
    otherwise.
    '''

    if opts is None:
        opts = mdiff.defaultopts

    if not node1 and not node2:
        node1 = repo.dirstate.p1()

    def lrugetfilectx():
        # filelogs of recently used files are cached; 'order' lists the
        # cached names, least recently used first
        cache = {}
        order = []
        def getfilectx(f, ctx):
            fctx = ctx.filectx(f, filelog=cache.get(f))
            if f not in cache:
                if len(cache) > 20:
                    # evict the least recently used entry
                    del cache[order.pop(0)]
                cache[f] = fctx.filelog()
            else:
                order.remove(f)
            order.append(f)
            return fctx
        return getfilectx
    getfilectx = lrugetfilectx()

    ctx1 = repo[node1]
    ctx2 = repo[node2]

    if not changes:
        changes = repo.status(ctx1, ctx2, match=match)
    modified, added, removed = changes[:3]

    if not modified and not added and not removed:
        return []

    revs = None
    if not repo.ui.quiet:
        hexfunc = repo.ui.debugflag and hex or short
        revs = [hexfunc(node) for node in [node1, node2] if node]

    copy = {}
    if opts.git or opts.upgrade:
        copy = copies.copies(repo, ctx1, ctx2, repo[nullid])[0]

    difffn = lambda opts, losedata: trydiff(repo, revs, ctx1, ctx2,
                 modified, added, removed, copy, getfilectx, opts, losedata, prefix)
    if opts.upgrade and not opts.git:
        try:
            def losedata(fn):
                # abort the plain diff unless the caller accepts the loss
                if not losedatafn or not losedatafn(fn=fn):
                    raise GitDiffRequired()
            # Buffer the whole output until we are sure it can be generated
            return list(difffn(opts.copy(git=False), losedata))
        except GitDiffRequired:
            return difffn(opts.copy(git=True), None)
    else:
        return difffn(opts, None)
1538 1538
def difflabel(func, *args, **kw):
    '''yields 2-tuples of (output, label) based on the output of func()

    Each chunk produced by func(*args, **kw) is split into lines. A line
    gets the label of the first matching prefix, or an empty label, and
    line breaks are yielded separately with an empty label. Trailing
    whitespace of lines starting with '+' or '-' is yielded apart, as
    'diff.trailingwhitespace'.'''
    labels = (('diff', 'diff.diffline'),
              ('copy', 'diff.extended'),
              ('rename', 'diff.extended'),
              ('old', 'diff.extended'),
              ('new', 'diff.extended'),
              ('deleted', 'diff.extended'),
              ('---', 'diff.file_a'),
              ('+++', 'diff.file_b'),
              ('@@', 'diff.hunk'),
              ('-', 'diff.deleted'),
              ('+', 'diff.inserted'))

    def findlabel(text):
        # first matching prefix wins, None when nothing matches
        for start, label in labels:
            if text.startswith(start):
                return label
        return None

    for chunk in func(*args, **kw):
        for lineno, line in enumerate(chunk.split('\n')):
            if lineno:
                yield ('\n', '')
            content = line
            if line[:1] in ('+', '-'):
                # highlight trailing whitespace, but only in changed lines
                content = line.rstrip()
            label = findlabel(content)
            if label is None:
                yield (line, '')
            else:
                yield (content, label)
            trailing = line[len(content):]
            if trailing:
                yield (trailing, 'diff.trailingwhitespace')
1570 1570
def diffui(*args, **kw):
    '''like diff(), but yields 2-tuples of (output, label) for ui.write()

    All arguments are handed over to diff() through difflabel().'''
    labelled = difflabel(diff, *args, **kw)
    return labelled
1574 1574
1575 1575
1576 1576 def _addmodehdr(header, omode, nmode):
1577 1577 if omode != nmode:
1578 1578 header.append('old mode %s\n' % omode)
1579 1579 header.append('new mode %s\n' % nmode)
1580 1580
def trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
            copy, getfilectx, opts, losedatafn, prefix):
    """Yield the diff between ctx1 and ctx2 as text chunks.

    For every file listed in modified, added or removed, taken in sorted
    order, this yields the joined header lines when there are any worth
    emitting, then the diff text if it is not empty.

    'copy' maps copy destinations to their sources. 'losedatafn' is called
    with the file name whenever a change cannot be represented without
    git extensions and opts.git is not set. 'prefix' is joined in front of
    the file names put in the output.
    """

    def join(f):
        return os.path.join(prefix, f)

    date1 = util.datestr(ctx1.date())
    man1 = ctx1.manifest()

    # copy sources already reported as the origin of a rename
    gone = set()
    gitmode = {'l': '120000', 'x': '100755', '': '100644'}

    # reverse mapping: copy source -> destination
    copyto = dict([(v, k) for k, v in copy.items()])

    if opts.git:
        revs = None

    for f in sorted(modified + added + removed):
        to = None
        tn = None
        # True: text diff, 'binary': base85 diff, False: no diff at all
        dodiff = True
        header = []
        if f in man1:
            to = getfilectx(f, ctx1).data()
        if f not in removed:
            tn = getfilectx(f, ctx2).data()
        a, b = f, f
        if opts.git or losedatafn:
            if f in added:
                mode = gitmode[ctx2.flags(f)]
                if f in copy or f in copyto:
                    if opts.git:
                        if f in copy:
                            a = copy[f]
                        else:
                            a = copyto[f]
                        omode = gitmode[man1.flags(a)]
                        _addmodehdr(header, omode, mode)
                        if a in removed and a not in gone:
                            # only the first copy of a removed source is
                            # reported as a rename
                            op = 'rename'
                            gone.add(a)
                        else:
                            op = 'copy'
                        header.append('%s from %s\n' % (op, join(a)))
                        header.append('%s to %s\n' % (op, join(f)))
                        to = getfilectx(a, ctx1).data()
                    else:
                        losedatafn(f)
                else:
                    if opts.git:
                        header.append('new file mode %s\n' % mode)
                    elif ctx2.flags(f):
                        losedatafn(f)
                # In theory, if tn was copied or renamed we should check
                # if the source is binary too but the copy record already
                # forces git mode.
                if util.binary(tn):
                    if opts.git:
                        dodiff = 'binary'
                    else:
                        losedatafn(f)
                if not opts.git and not tn:
                    # regular diffs cannot represent new empty file
                    losedatafn(f)
            elif f in removed:
                if opts.git:
                    # have we already reported a copy above?
                    if ((f in copy and copy[f] in added
                         and copyto[copy[f]] == f) or
                        (f in copyto and copyto[f] in added
                         and copy[copyto[f]] == f)):
                        dodiff = False
                    else:
                        header.append('deleted file mode %s\n' %
                                      gitmode[man1.flags(f)])
                elif not to or util.binary(to):
                    # regular diffs cannot represent empty file deletion
                    losedatafn(f)
            else:
                oflag = man1.flags(f)
                nflag = ctx2.flags(f)
                binary = util.binary(to) or util.binary(tn)
                if opts.git:
                    _addmodehdr(header, gitmode[oflag], gitmode[nflag])
                    if binary:
                        dodiff = 'binary'
                elif binary or nflag != oflag:
                    losedatafn(f)
            if opts.git:
                # the diff line always comes first in git headers
                header.insert(0, mdiff.diffline(revs, join(a), join(b), opts))

        if dodiff:
            if dodiff == 'binary':
                text = b85diff(to, tn)
            else:
                text = mdiff.unidiff(to, date1,
                                    # ctx2 date may be dynamic
                                    tn, util.datestr(ctx2.date()),
                                    join(a), join(b), revs, opts=opts)
            # a header made of a single line is dropped when there is no
            # diff text to go with it
            if header and (text or len(header) > 1):
                yield ''.join(header)
            if text:
                yield text
1684 1684
def diffstatdata(lines):
    """Yield (filename, adds, removes, isbinary) for each file of a diff.

    A new entry starts at every line beginning with 'diff'. isbinary is
    set when neither added nor removed lines were counted for the file.
    """
    hgdiffre = re.compile(r'^diff .*-r [a-z0-9]+\s(.*)$')

    def entry(name, plus, minus):
        return (name, plus, minus, plus == 0 and minus == 0)

    current = None
    plus = minus = 0
    for line in lines:
        if line.startswith('diff'):
            if current:
                yield entry(current, plus, minus)
            # set numbers to 0 anyway when starting new file
            plus = minus = 0
            if line.startswith('diff --git'):
                current = gitre.search(line).group(1)
            elif line.startswith('diff -r'):
                # format: "diff -r ... -r ... filename"
                current = hgdiffre.search(line).group(1)
        elif line[:1] == '+':
            if line[:3] != '+++':
                plus += 1
        elif line[:1] == '-':
            if line[:3] != '---':
                minus += 1
    if current:
        yield entry(current, plus, minus)
1708 1708
def diffstat(lines, width=80, git=False):
    """Return a diffstat summary of the diff in 'lines', as a string.

    One line is produced per file with its name, change count and a
    +/- graph scaled to fit 'width', followed by a total line. With 'git'
    set, files flagged as binary by diffstatdata() show 'Bin' instead of
    a count.
    """
    stats = list(diffstatdata(lines))
    rows = [(name, plus, minus, binary, encoding.colwidth(name))
            for name, plus, minus, binary in stats]

    totaladds = sum([row[1] for row in rows])
    totalremoves = sum([row[2] for row in rows])
    maxname = max([0] + [row[4] for row in rows])
    maxtotal = max([0] + [row[1] + row[2] for row in rows])
    hasbinary = bool([row for row in rows if row[3]])

    countwidth = len(str(maxtotal))
    if hasbinary:
        countwidth = max(countwidth, 3)
    graphwidth = max(width - countwidth - maxname - 6, 10)

    def scale(i):
        if maxtotal <= graphwidth:
            return i
        # If diffstat runs out of room it doesn't print anything,
        # which isn't very useful, so always print at least one + or -
        # if there were at least some changes.
        return max(i * graphwidth // maxtotal, int(bool(i)))

    output = []
    for name, plus, minus, binary, namewidth in rows:
        count = plus + minus
        if git and binary:
            count = 'Bin'
        padding = ' ' * (maxname - namewidth)
        output.append(' %s%s | %*s %s%s\n' %
                      (name, padding, countwidth, count,
                       '+' * scale(plus), '-' * scale(minus)))

    if stats:
        output.append(_(' %d files changed, %d insertions(+), %d deletions(-)\n')
                      % (len(stats), totaladds, totalremoves))

    return ''.join(output)
1760 1760
def diffstatui(*args, **kw):
    '''like diffstat(), but yields 2-tuples of (output, label) for
    ui.write()

    Lines ending with '+' or '-' are split into the text before the
    graph, the run of '+' and the run of '-'; other lines are yielded
    whole with an empty label.
    '''
    graphparts = ((r'\++', 'diffstat.inserted'),
                  (r'-+', 'diffstat.deleted'))

    for line in diffstat(*args, **kw).splitlines():
        if not line or line[-1] not in '+-':
            yield (line, '')
        else:
            name, graph = line.rsplit(' ', 1)
            yield (name + ' ', '')
            for pattern, label in graphparts:
                found = re.search(pattern, graph)
                if found:
                    yield (found.group(0), label)
        yield ('\n', '')
General Comments 0
You need to be logged in to leave comments. Login now