patch.py
2478 lines
| 84.4 KiB
| text/x-python
|
PythonLexer
/ mercurial / patch.py
Brendan Cully
|
r2861 | # patch.py - patch file parsing routines | ||
# | ||||
Vadim Gelfer
|
r2865 | # Copyright 2006 Brendan Cully <brendan@kublai.com> | ||
Bryan O'Sullivan
|
r4897 | # Copyright 2007 Chris Mason <chris.mason@oracle.com> | ||
Vadim Gelfer
|
r2865 | # | ||
Martin Geisler
|
r8225 | # This software may be used and distributed according to the terms of the | ||
Matt Mackall
|
r10263 | # GNU General Public License version 2 or any later version. | ||
Brendan Cully
|
r2861 | |||
Martin von Zweigbergk
|
r25113 | import collections | ||
Laurent Charignon
|
r24269 | import cStringIO, email, os, errno, re, posixpath, copy | ||
Patrick Mezard
|
r14452 | import tempfile, zlib, shutil | ||
Augie Fackler
|
r19810 | # On python2.4 you have to import these by name or they fail to | ||
# load. This was not a problem on Python 2.7. | ||||
import email.Generator | ||||
import email.Parser | ||||
Augie Fackler
|
r10965 | |||
Matt Mackall
|
r3891 | from i18n import _ | ||
Johan Bjork
|
r19875 | from node import hex, short | ||
Patrick Mezard
|
r14611 | import base85, mdiff, scmutil, util, diffhelpers, copies, encoding, error | ||
Siddharth Agarwal
|
r24390 | import pathutil | ||
Vadim Gelfer
|
r2866 | |||
Dirkjan Ochtman
|
# Matches the "diff --git a/<src> b/<dst>" line of a git-style patch;
# group 1 is the source path and group 2 the destination path.
gitre = re.compile(r'diff --git a/(.*) b/(.*)')
# Splits a string into alternating runs of tabs and runs of non-tab text.
tabsplitter = re.compile(r'(\t+|[^\t]+)')
Dirkjan Ochtman
|
r7199 | |||
Bryan O'Sullivan
|
class PatchError(Exception):
    """Error raised by the patching routines of this module, for example
    for a malformed hunk or when the target file is not tracked."""
Brendan Cully
|
r2933 | |||
# public functions | ||||
Brendan Cully
|
def split(stream):
    '''return an iterator of individual patches from a stream

    stream is iterated line by line; if it has no 'next' attribute it
    is wrapped so that its readline() method is used instead. The first
    lines are inspected to choose a splitting strategy:

    - a line starting with '# HG changeset patch': split before each
      such line that follows a blank line
    - a line starting with 'From ': treat the input as an mbox and split
      each message recursively
    - a 'content-type' header: let the email parser extract the parts
    - header-like lines followed by a '--- ' line: split before each new
      run of header lines
    - otherwise, everything read is returned as a single patch

    Every item produced is a cStringIO.StringIO holding one patch.'''
    def isheader(line, inheader):
        # Return True if line looks like a "Name: value" header line, or
        # like the continuation of one when inheader is set.
        if inheader and line[0] in (' ', '\t'):
            # continuation
            return True
        if line[0] in (' ', '-', '+'):
            # diff line - don't check for header pattern in there
            return False
        l = line.split(': ', 1)
        return len(l) == 2 and ' ' not in l[0]

    def chunk(lines):
        # Wrap the accumulated lines in a file-like object.
        return cStringIO.StringIO(''.join(lines))

    def hgsplit(stream, cur):
        # cur already holds the lines consumed by the caller, including
        # the first '# HG changeset patch' line.
        inheader = True

        for line in stream:
            if not line.strip():
                # a blank line ends the header of the current patch
                inheader = False
            if not inheader and line.startswith('# HG changeset patch'):
                yield chunk(cur)
                cur = []
                inheader = True

            cur.append(line)

        if cur:
            yield chunk(cur)

    def mboxsplit(stream, cur):
        for line in stream:
            if line.startswith('From '):
                # cur[0] is the 'From ' separator line of the previous
                # message: drop it and split the message body recursively
                for c in split(chunk(cur[1:])):
                    yield c
                cur = []

            cur.append(line)

        if cur:
            for c in split(chunk(cur[1:])):
                yield c

    def mimesplit(stream, cur):
        def msgfp(m):
            # Flatten message (or message part) m into a rewound buffer.
            fp = cStringIO.StringIO()
            g = email.Generator.Generator(fp, mangle_from_=False)
            g.flatten(m)
            fp.seek(0)
            return fp

        # the email parser needs the whole input: read the rest of it
        for line in stream:
            cur.append(line)
        c = chunk(cur)

        m = email.Parser.Parser().parse(c)
        if not m.is_multipart():
            yield msgfp(m)
        else:
            # only parts with one of these content types are yielded
            ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
            for part in m.walk():
                ct = part.get_content_type()
                if ct not in ok_types:
                    continue
                yield msgfp(part)

    def headersplit(stream, cur):
        inheader = False

        for line in stream:
            if not inheader and isheader(line, inheader):
                # first header line after non-header content: a new
                # patch starts here
                yield chunk(cur)
                cur = []
                inheader = True
            if inheader and not isheader(line, inheader):
                inheader = False

            cur.append(line)

        if cur:
            yield chunk(cur)

    def remainder(cur):
        yield chunk(cur)

    class fiter(object):
        # Adapt an object providing only readline() to the (Python 2)
        # iterator protocol; iteration stops at the first empty read.
        def __init__(self, fp):
            self.fp = fp

        def __iter__(self):
            return self

        def next(self):
            l = self.fp.readline()
            if not l:
                raise StopIteration
            return l

    inheader = False
    cur = []

    mimeheaders = ['content-type']

    if not util.safehasattr(stream, 'next'):
        # http responses, for example, have readline but not next
        stream = fiter(stream)

    # Sniff the input until a strategy can be chosen. The selected
    # generator receives the same, partially consumed, stream plus the
    # lines read so far in cur.
    for line in stream:
        cur.append(line)
        if line.startswith('# HG changeset patch'):
            return hgsplit(stream, cur)
        elif line.startswith('From '):
            return mboxsplit(stream, cur)
        elif isheader(line, inheader):
            inheader = True
            if line.split(':', 1)[0].lower() in mimeheaders:
                # let email parser handle this
                return mimesplit(stream, cur)
        elif line.startswith('--- ') and inheader:
            # No evil headers seen by diff start, split by hand
            return headersplit(stream, cur)
        # Not enough info, keep reading

    # if we are here, we have a very plain patch
    return remainder(cur)
Vadim Gelfer
|
def extract(ui, fileobj):
    '''extract patch from data read from fileobj.

    patch can be a normal patch or contained in an email message.

    return tuple (filename, message, user, date, branch, node, p1, p2).
    Any item in the returned tuple can be None. If filename is None,
    fileobj did not contain a patch. Caller must unlink filename when done.

    fileobj is parsed with the email parser. The payload of every part
    containing a diff is written to a temporary file (created with
    prefix 'hg-patch-') whose name is returned as filename. The text
    preceding the diff becomes the commit message, and "# User",
    "# Date", "# Branch", "# Node ID" and "# Parent" lines following a
    "# HG changeset patch" line provide the other fields. If anything
    raises while parsing, the temporary file is removed and the
    exception is re-raised.'''

    # attempt to detect the start of a patch
    # (this heuristic is borrowed from quilt)
    diffre = re.compile(r'^(?:Index:[ \t]|diff[ \t]|RCS file: |'
                        r'retrieving revision [0-9]+(\.[0-9]+)*$|'
                        r'---[ \t].*?^\+\+\+[ \t]|'
                        r'\*\*\*[ \t].*?^---[ \t])', re.MULTILINE|re.DOTALL)

    fd, tmpname = tempfile.mkstemp(prefix='hg-patch-')
    tmpfp = os.fdopen(fd, 'w')
    try:
        msg = email.Parser.Parser().parse(fileobj)

        subject = msg['Subject']
        user = msg['From']
        if not subject and not user:
            # Not an email, restore parsed headers if any
            subject = '\n'.join(': '.join(h) for h in msg.items()) + '\n'

        # should try to parse msg['Date']
        date = None
        nodeid = None
        branch = None
        parents = []

        if subject:
            if subject.startswith('[PATCH'):
                # strip the leading "[PATCH ...]" tag
                pend = subject.find(']')
                if pend >= 0:
                    subject = subject[pend + 1:].lstrip()
            # unfold continuation lines into a single line
            subject = re.sub(r'\n[ \t]+', ' ', subject)
            ui.debug('Subject: %s\n' % subject)
        if user:
            ui.debug('From: %s\n' % user)
        diffs_seen = 0
        ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
        message = ''
        for part in msg.walk():
            content_type = part.get_content_type()
            ui.debug('Content-Type: %s\n' % content_type)
            if content_type not in ok_types:
                continue
            payload = part.get_payload(decode=True)
            m = diffre.search(payload)
            if m:
                # hgpatch: a '# HG changeset patch' line was seen
                # hgpatchheader: currently inside the '# ...' header lines
                # ignoretext: a '---' line was seen, drop following text
                hgpatch = False
                hgpatchheader = False
                ignoretext = False

                ui.debug('found patch at byte %d\n' % m.start(0))
                diffs_seen += 1
                cfp = cStringIO.StringIO()
                # everything before the diff is candidate message text
                for line in payload[:m.start(0)].splitlines():
                    if line.startswith('# HG changeset patch') and not hgpatch:
                        ui.debug('patch generated by hg export\n')
                        hgpatch = True
                        hgpatchheader = True
                        # drop earlier commit message content
                        cfp.seek(0)
                        cfp.truncate()
                        subject = None
                    elif hgpatchheader:
                        if line.startswith('# User '):
                            user = line[7:]
                            ui.debug('From: %s\n' % user)
                        elif line.startswith("# Date "):
                            date = line[7:]
                        elif line.startswith("# Branch "):
                            branch = line[9:]
                        elif line.startswith("# Node ID "):
                            nodeid = line[10:]
                        elif line.startswith("# Parent "):
                            parents.append(line[9:].lstrip())
                        elif not line.startswith("# "):
                            # first non-'# ' line ends the header; it
                            # is written to the message below
                            hgpatchheader = False
                    elif line == '---':
                        ignoretext = True
                    if not hgpatchheader and not ignoretext:
                        cfp.write(line)
                        cfp.write('\n')
                message = cfp.getvalue()
                if tmpfp:
                    # the whole payload (not only the diff) goes to the
                    # temporary file, newline-terminated
                    tmpfp.write(payload)
                    if not payload.endswith('\n'):
                        tmpfp.write('\n')
            elif not diffs_seen and message and content_type == 'text/plain':
                message += '\n' + payload
    except: # re-raises
        tmpfp.close()
        os.unlink(tmpname)
        raise

    if subject and not message.startswith(subject):
        message = '%s\n%s' % (subject, message)
    tmpfp.close()
    if not diffs_seen:
        # no patch found: nothing for the caller to clean up
        os.unlink(tmpname)
        return None, message, user, date, branch, None, None, None

    # the first two '# Parent' lines, in order, are p1 and p2
    if parents:
        p1 = parents.pop(0)
    else:
        p1 = None

    if parents:
        p2 = parents.pop(0)
    else:
        p2 = None

    return tmpname, message, user, date, branch, nodeid, p1, p2
Brendan Cully
|
r2861 | |||
Benoit Boissinot
|
class patchmeta(object):
    """Metadata describing one patched file.

    'op' names the operation performed: ADD, DELETE, RENAME, MODIFY or
    COPY. 'path' is the path of the patched file. 'oldpath' is the
    origin file when 'op' is COPY or RENAME, and None otherwise. When
    the file mode is changed, 'mode' is an (islink, isexec) tuple whose
    items are true if the file is a symlink, respectively executable;
    otherwise 'mode' is None. 'binary' is set for binary patches.
    """
    def __init__(self, path):
        self.path = path
        self.oldpath = None
        self.mode = None
        self.op = 'MODIFY'
        self.binary = False

    def setmode(self, mode):
        """Record the symlink and executable bits of the numeric mode."""
        self.mode = (mode & 0o20000, mode & 0o100)

    def copy(self):
        """Return a new patchmeta carrying the same attribute values."""
        clone = patchmeta(self.path)
        for attr in ('oldpath', 'mode', 'op', 'binary'):
            setattr(clone, attr, getattr(self, attr))
        return clone

    def _ispatchinga(self, afile):
        # '/dev/null' as the old side is only consistent with an addition
        if afile != '/dev/null':
            return afile == 'a/' + (self.oldpath or self.path)
        return self.op == 'ADD'

    def _ispatchingb(self, bfile):
        # '/dev/null' as the new side is only consistent with a deletion
        if bfile != '/dev/null':
            return bfile == 'b/' + self.path
        return self.op == 'DELETE'

    def ispatching(self, afile, bfile):
        """Tell whether the afile/bfile pair of a diff header is
        consistent with this metadata."""
        if not self._ispatchinga(afile):
            return False
        return self._ispatchingb(bfile)

    def __repr__(self):
        return "<patchmeta %s %r>" % (self.op, self.path)
Patrick Mezard
|
def readgitpatch(lr):
    """Collect git extended-header metadata from the lines of a patch.

    lr is iterated line by line. Every 'diff --git a/... b/...' line
    starts a new patchmeta for the destination path; the extended
    header lines that follow (rename, copy, deleted file, new file
    mode, new mode, GIT binary patch) update it until a line starting
    with '--- ' or the next 'diff --git' line is reached.

    Return the list of patchmeta objects in the order they were found.
    """
    found = []
    current = None
    for raw in lr:
        text = raw.rstrip(' \r\n')
        if text.startswith('diff --git a/'):
            match = gitre.match(text)
            if match:
                if current:
                    found.append(current)
                current = patchmeta(match.group(2))
            continue
        if not current:
            # not inside a git header: nothing to record
            continue
        if text.startswith('--- '):
            # the diff itself starts here: this header is complete
            found.append(current)
            current = None
        elif text.startswith('rename from '):
            current.op = 'RENAME'
            current.oldpath = text[12:]
        elif text.startswith('rename to '):
            current.path = text[10:]
        elif text.startswith('copy from '):
            current.op = 'COPY'
            current.oldpath = text[10:]
        elif text.startswith('copy to '):
            current.path = text[8:]
        elif text.startswith('deleted file'):
            current.op = 'DELETE'
        elif text.startswith('new file mode '):
            current.op = 'ADD'
            # the mode is the last six characters, in octal
            current.setmode(int(text[-6:], 8))
        elif text.startswith('new mode '):
            current.setmode(int(text[-6:], 8))
        elif text.startswith('GIT binary patch'):
            current.binary = True
    if current:
        found.append(current)

    return found
Brendan Cully
|
r2861 | |||
Simon Heimberg
|
class linereader(object):
    """Line-oriented reader over fp that lets lines be pushed back.

    Pushed lines are returned, oldest first, before anything else is
    read from fp.
    """
    def __init__(self, fp):
        self.fp = fp
        self.buf = []

    def push(self, line):
        """Queue line to be returned by a later read; None is ignored."""
        if line is None:
            return
        self.buf.append(line)

    def readline(self):
        """Return the oldest pushed-back line, or else read one from fp."""
        if not self.buf:
            return self.fp.readline()
        return self.buf.pop(0)

    def __iter__(self):
        # iteration ends at the first empty line returned by readline()
        line = self.readline()
        while line:
            yield line
            line = self.readline()
Patrick Mezard
|
class abstractbackend(object):
    """Interface of the objects patched files are read from and written to.

    Except for writerej(), which does nothing by default, every method
    raises NotImplementedError and has to be provided by subclasses.
    """
    def __init__(self, ui):
        self.ui = ui

    def getfile(self, fname):
        """Return the data and flags of target file fname as a
        (data, (islink, isexec)) tuple. Data is None if the file is
        missing/deleted.
        """
        raise NotImplementedError

    def setfile(self, fname, data, mode, copysource):
        """Write data to target file fname and set its mode, mode being
        an (islink, isexec) tuple. If data is None, the file content
        should be left unchanged. If the file is modified after being
        copied, copysource is set to the original file name.
        """
        raise NotImplementedError

    def unlink(self, fname):
        """Unlink target file fname."""
        raise NotImplementedError

    def writerej(self, fname, failed, total, lines):
        """Write rejected lines for fname. failed is the number of hunks
        which failed to apply and total the total number of hunks for
        this file.
        """

    def exists(self, fname):
        """Tell whether target file fname exists."""
        raise NotImplementedError
Patrick Mezard
|
class fsbackend(abstractbackend):
    """Backend patching files on the filesystem, below basedir.

    All file accesses go through an opener rooted at basedir.
    """
    def __init__(self, ui, basedir):
        super(fsbackend, self).__init__(ui)
        self.opener = scmutil.opener(basedir)

    def _join(self, f):
        # path of f below the opener base directory
        return os.path.join(self.opener.base, f)

    def getfile(self, fname):
        """Return (data, (islink, isexec)) for fname.

        For a symlink, data is the link target. (None, None) is
        returned if the file does not exist; other OSError/IOError
        errors are propagated.
        """
        if self.opener.islink(fname):
            return (self.opener.readlink(fname), (True, False))

        isexec = False
        try:
            isexec = (self.opener.lstat(fname).st_mode & 0o100) != 0
        except OSError as e:
            # a missing file is reported by the read below
            if e.errno != errno.ENOENT:
                raise
        try:
            return (self.opener.read(fname), (False, isexec))
        except IOError as e:
            if e.errno != errno.ENOENT:
                raise
            return None, None

    def setfile(self, fname, data, mode, copysource):
        """Write data to fname and apply the (islink, isexec) mode.

        If data is None only the flags are updated. copysource is not
        used by this backend.
        """
        islink, isexec = mode
        if data is None:
            self.opener.setflags(fname, islink, isexec)
            return
        if islink:
            self.opener.symlink(data, fname)
        else:
            self.opener.write(fname, data)
            if isexec:
                self.opener.setflags(fname, False, True)

    def unlink(self, fname):
        """Remove fname; a missing file is not an error."""
        self.opener.unlinkpath(fname, ignoremissing=True)

    def writerej(self, fname, failed, total, lines):
        """Warn about the failed hunks and save lines to fname + '.rej'."""
        fname = fname + ".rej"
        self.ui.warn(
            _("%d out of %d hunks FAILED -- saving rejects to file %s\n") %
            (failed, total, fname))
        fp = self.opener(fname, 'w')
        try:
            fp.writelines(lines)
        finally:
            # do not leak the file handle if writing fails
            fp.close()

    def exists(self, fname):
        """Tell whether fname exists (symlinks are not followed)."""
        return self.opener.lexists(fname)
Patrick Mezard
|
r14351 | |||
Patrick Mezard
|
class workingbackend(fsbackend):
    """Filesystem backend patching the working directory of repo.

    Changed, removed and copied files are recorded so that close() can
    update the dirstate accordingly.
    """
    def __init__(self, ui, repo, similarity):
        super(workingbackend, self).__init__(ui, repo.root)
        self.repo = repo
        self.similarity = similarity
        self.removed = set()
        self.changed = set()
        self.copied = []

    def _checkknown(self, fname):
        # refuse to touch a file which exists but is unknown to the dirstate
        untracked = self.repo.dirstate[fname] == '?'
        if untracked and self.exists(fname):
            raise PatchError(_('cannot patch %s: file is not tracked') % fname)

    def setfile(self, fname, data, mode, copysource):
        """Write fname like fsbackend does and record it as changed,
        and as copied from copysource if that is not None."""
        self._checkknown(fname)
        super(workingbackend, self).setfile(fname, data, mode, copysource)
        if copysource is not None:
            self.copied.append((copysource, fname))
        self.changed.add(fname)

    def unlink(self, fname):
        """Remove fname and record it as both removed and changed."""
        self._checkknown(fname)
        super(workingbackend, self).unlink(fname)
        self.removed.add(fname)
        self.changed.add(fname)

    def close(self):
        """Record copies and removals in the dirstate, mark the touched
        files and return the sorted list of changed files."""
        workingctx = self.repo[None]
        touched = set(self.changed)
        for source, dest in self.copied:
            scmutil.dirstatecopy(self.ui, self.repo, workingctx, source, dest)
        if self.removed:
            workingctx.forget(sorted(self.removed))
            # A file which was deleted and no longer belongs to the
            # dirstate was probably marked added then deleted: it
            # should not be considered by marktouched().
            gone = [f for f in self.removed if f not in self.repo.dirstate]
            touched.difference_update(gone)
        if touched:
            scmutil.marktouched(self.repo, touched, self.similarity)
        return sorted(self.changed)
Patrick Mezard
|
class filestore(object):
    """Store of file contents, kept in memory up to maxsize bytes.

    Data which does not fit in the memory budget is written to files in
    a temporary directory created on demand. maxsize defaults to 4 MiB;
    a negative value keeps everything in memory.
    """
    def __init__(self, maxsize=None):
        self.opener = None
        self.files = {}
        self.created = 0
        self.maxsize = maxsize
        if self.maxsize is None:
            self.maxsize = 4*(2**20)
        self.size = 0
        self.data = {}

    def setfile(self, fname, data, mode, copied=None):
        """Store (data, mode, copied) under fname.

        A previous entry for fname is replaced: its memory is given
        back to the budget and it can no longer be returned by
        getfile(), wherever the new data ends up being stored.
        """
        datalen = len(data)
        # Forget the previous version first, otherwise its size would be
        # counted twice and a stale in-memory copy would hide data
        # written to disk later on.
        previous = self.data.pop(fname, None)
        if previous is not None:
            self.size -= len(previous[0])
        self.files.pop(fname, None)

        if self.maxsize < 0 or (datalen + self.size) <= self.maxsize:
            self.data[fname] = (data, mode, copied)
            self.size += datalen
        else:
            if self.opener is None:
                root = tempfile.mkdtemp(prefix='hg-patch-')
                self.opener = scmutil.opener(root)
            # Avoid filename issues with these simple names
            fn = str(self.created)
            self.opener.write(fn, data)
            self.created += 1
            self.files[fname] = (fn, mode, copied)

    def getfile(self, fname):
        """Return the (data, mode, copied) tuple stored under fname, or
        (None, None, None) if there is none."""
        if fname in self.data:
            return self.data[fname]
        if not self.opener or fname not in self.files:
            return None, None, None
        fn, mode, copied = self.files[fname]
        return self.opener.read(fn), mode, copied

    def close(self):
        """Remove the temporary directory, if one was created."""
        if self.opener:
            shutil.rmtree(self.opener.base)
Patrick Mezard
|
class repobackend(abstractbackend):
    """Backend reading files from the changectx ctx and writing the
    patched contents to store instead of the filesystem."""
    def __init__(self, ui, repo, ctx, store):
        super(repobackend, self).__init__(ui)
        self.repo = repo
        self.ctx = ctx
        self.store = store
        self.changed = set()
        self.removed = set()
        self.copied = {}

    def _checkknown(self, fname):
        # only files present in ctx can be patched
        if fname in self.ctx:
            return
        raise PatchError(_('cannot patch %s: file is not tracked') % fname)

    def getfile(self, fname):
        """Return (data, (islink, isexec)) of fname in ctx, or
        (None, None) if looking it up fails."""
        try:
            filectx = self.ctx[fname]
        except error.LookupError:
            return None, None
        flags = filectx.flags()
        return filectx.data(), ('l' in flags, 'x' in flags)

    def setfile(self, fname, data, mode, copysource):
        """Save the new content of fname in the store and record it as
        changed. If data is None the content found in ctx is used. A
        true copysource must be in ctx and is recorded as copy origin."""
        if copysource:
            self._checkknown(copysource)
        if data is None:
            data = self.ctx[fname].data()
        self.store.setfile(fname, data, mode, copysource)
        self.changed.add(fname)
        if copysource:
            self.copied[fname] = copysource

    def unlink(self, fname):
        """Record fname, which must be in ctx, as removed."""
        self._checkknown(fname)
        self.removed.add(fname)

    def exists(self, fname):
        """Tell whether fname is in ctx."""
        return fname in self.ctx

    def close(self):
        """Return the set of changed and removed file names."""
        return self.changed.union(self.removed)
Patrick Mezard
|
# Raw strings are used so that '\d', '\+' and '\*' reach the regex
# engine untouched instead of relying on unrecognized string escapes.

# @@ -start,len +start,len @@ or @@ -start +start @@ if len is 1
unidesc = re.compile(r'@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@')
# "--- start,len ---" or "*** start,len ***", the length being optional
contextdesc = re.compile(r'(?:---|\*\*\*) (\d+)(?:,(\d+))? (?:---|\*\*\*)')
# accepted values for the 'eolmode' setting
eolmodes = ['strict', 'crlf', 'lf', 'auto']
class patchfile(object):
    """State of one file while the hunks of a patch are applied to it.

    The current content is loaded as a list of lines from the backend
    (or from the store when the file is a copy/rename of another one),
    hunks are applied in memory with apply(), and close() writes the
    result and the rejected hunks through the backend.
    """
    def __init__(self, ui, gp, backend, store, eolmode='strict'):
        # gp provides the path, mode, operation and copy source of the
        # file; eolmode is expected to be one of the 'eolmodes' values.
        self.fname = gp.path
        self.eolmode = eolmode
        self.eol = None
        self.backend = backend
        self.ui = ui
        self.lines = []
        self.exists = False
        self.missing = True
        self.mode = gp.mode
        self.copysource = gp.oldpath
        self.create = gp.op in ('ADD', 'COPY', 'RENAME')
        self.remove = gp.op == 'DELETE'
        if self.copysource is None:
            data, mode = backend.getfile(self.fname)
        else:
            # copied/renamed file: start from the content of its source
            data, mode = store.getfile(self.copysource)[:2]
        if data is not None:
            self.exists = self.copysource is None or backend.exists(self.fname)
            self.missing = False
            if data:
                self.lines = mdiff.splitnewlines(data)
            if self.mode is None:
                self.mode = mode
            if self.lines:
                # Normalize line endings
                # (the EOL of the first line is remembered in self.eol)
                if self.lines[0].endswith('\r\n'):
                    self.eol = '\r\n'
                elif self.lines[0].endswith('\n'):
                    self.eol = '\n'
                if eolmode != 'strict':
                    nlines = []
                    for l in self.lines:
                        if l.endswith('\r\n'):
                            l = l[:-2] + '\n'
                        nlines.append(l)
                    self.lines = nlines
        else:
            # no existing data: fine only if the patch creates the file
            if self.create:
                self.missing = False
            if self.mode is None:
                self.mode = (False, False)
        if self.missing:
            self.ui.warn(_("unable to find '%s' for patching\n") % self.fname)

        self.hash = {}      # line content -> list of line indexes
        self.dirty = 0      # set once self.lines has been modified
        self.offset = 0     # accumulated line count change of applied hunks
        self.skew = 0       # distance from expected position of last fuzzy match
        self.rej = []       # rejected hunks
        self.fileprinted = False
        self.printfile(False)
        self.hunks = 0      # number of hunks processed by apply()

    def writelines(self, fname, lines, mode):
        """Write lines to fname through the backend, converting trailing
        '\\n' to the EOL selected by eolmode when it is not 'strict'."""
        if self.eolmode == 'auto':
            eol = self.eol
        elif self.eolmode == 'crlf':
            eol = '\r\n'
        else:
            eol = '\n'

        if self.eolmode != 'strict' and eol and eol != '\n':
            rawlines = []
            for l in lines:
                if l and l[-1] == '\n':
                    l = l[:-1] + eol
                rawlines.append(l)
            lines = rawlines

        self.backend.setfile(fname, ''.join(lines), mode, self.copysource)

    def printfile(self, warn):
        """Report the name of the file being patched, as a warning if
        warn is set and as a note otherwise. Nothing is done once the
        name has been reported as a warning or in verbose mode."""
        if self.fileprinted:
            return
        if warn or self.ui.verbose:
            self.fileprinted = True
        s = _("patching file %s\n") % self.fname
        if warn:
            self.ui.warn(s)
        else:
            self.ui.note(s)

    def findlines(self, l, linenum):
        # looks through the hash and finds candidate lines.  The
        # result is a list of line numbers sorted based on distance
        # from linenum

        cand = self.hash.get(l, [])
        if len(cand) > 1:
            # resort our list of potentials forward then back.
            cand.sort(key=lambda x: abs(x - linenum))
        return cand

    def write_rej(self):
        # our rejects are a little different from patch(1).  This always
        # creates rejects in the same form as the original patch.  A file
        # header is inserted so that you can run the reject through patch again
        # without having to type the filename.
        if not self.rej:
            return
        base = os.path.basename(self.fname)
        lines = ["--- %s\n+++ %s\n" % (base, base)]
        for x in self.rej:
            for l in x.hunk:
                lines.append(l)
                if l[-1] != '\n':
                    lines.append("\n\ No newline at end of file\n")
        self.backend.writerej(self.fname, len(self.rej), self.hunks, lines)

    def apply(self, h):
        """Apply hunk h to the in-memory lines of the file.

        Return 0 if the hunk applied at its expected position, the fuzz
        used (which may be 0) if it applied somewhere else or with
        fuzz, and -1 if it was rejected. Rejected hunks are collected
        in self.rej. Raise PatchError if the hunk is not complete.
        """
        if not h.complete():
            raise PatchError(_("bad hunk #%d %s (%d %d %d %d)") %
                            (h.number, h.desc, len(h.a), h.lena, len(h.b),
                            h.lenb))

        self.hunks += 1

        if self.missing:
            self.rej.append(h)
            return -1

        if self.exists and self.create:
            if self.copysource:
                self.ui.warn(_("cannot create %s: destination already "
                               "exists\n") % self.fname)
            else:
                self.ui.warn(_("file %s already exists\n") % self.fname)
            self.rej.append(h)
            return -1

        if isinstance(h, binhunk):
            # binary hunks replace the whole content
            if self.remove:
                self.backend.unlink(self.fname)
            else:
                l = h.new(self.lines)
                self.lines[:] = l
                self.offset += len(l)
                self.dirty = True
            return 0

        # keep the untouched hunk: this is what gets rejected on failure
        horig = h
        if (self.eolmode in ('crlf', 'lf')
            or self.eolmode == 'auto' and self.eol):
            # If new eols are going to be normalized, then normalize
            # hunk data before patching. Otherwise, preserve input
            # line-endings.
            h = h.getnormalized()

        # fast case first, no offsets, no fuzz
        old, oldstart, new, newstart = h.fuzzit(0, False)
        oldstart += self.offset
        orig_start = oldstart
        # if there's skew we want to emit the "(offset %d lines)" even
        # when the hunk cleanly applies at start + skew, so skip the
        # fast case code
        if (self.skew == 0 and
            diffhelpers.testhunk(old, self.lines, oldstart) == 0):
            if self.remove:
                self.backend.unlink(self.fname)
            else:
                self.lines[oldstart:oldstart + len(old)] = new
                self.offset += len(new) - len(old)
                self.dirty = True
            return 0

        # ok, we couldn't match the hunk. Lets look for offsets and fuzz it
        self.hash = {}
        for x, s in enumerate(self.lines):
            self.hash.setdefault(s, []).append(x)

        # try increasing amounts of fuzz (0, 1, 2), each time with
        # toponly set and then unset
        for fuzzlen in xrange(3):
            for toponly in [True, False]:
                old, oldstart, new, newstart = h.fuzzit(fuzzlen, toponly)
                oldstart = oldstart + self.offset + self.skew
                oldstart = min(oldstart, len(self.lines))
                if old:
                    # candidate positions: lines equal to the first old
                    # line, stripped of its leading character
                    cand = self.findlines(old[0][1:], oldstart)
                else:
                    # Only adding lines with no or fuzzed context, just
                    # take the skew in account
                    cand = [oldstart]

                for l in cand:
                    if not old or diffhelpers.testhunk(old, self.lines, l) == 0:
                        self.lines[l : l + len(old)] = new
                        self.offset += len(new) - len(old)
                        self.skew = l - orig_start
                        self.dirty = True
                        offset = l - orig_start - fuzzlen
                        if fuzzlen:
                            msg = _("Hunk #%d succeeded at %d "
                                    "with fuzz %d "
                                    "(offset %d lines).\n")
                            self.printfile(True)
                            self.ui.warn(msg %
                                (h.number, l + 1, fuzzlen, offset))
                        else:
                            msg = _("Hunk #%d succeeded at %d "
                                    "(offset %d lines).\n")
                            self.ui.note(msg % (h.number, l + 1, offset))
                        return fuzzlen
        self.printfile(True)
        self.ui.warn(_("Hunk #%d FAILED at %d\n") % (h.number, orig_start))
        self.rej.append(horig)
        return -1

    def close(self):
        """Write the patched content if it was modified, write the
        rejects, and return the number of rejected hunks."""
        if self.dirty:
            self.writelines(self.fname, self.lines, self.mode)
        self.write_rej()
        return len(self.rej)
Laurent Charignon
|
class header(object):
    """Header lines of one file's diff plus the hunks attached to it.

    ``header`` is the list of raw header lines, the ``diff ...`` line
    first. ``hunks`` starts empty and is filled in by the patch parser.
    """
    diffgit_re = re.compile('diff --git a/(.*) b/(.*)$')
    diff_re = re.compile('diff -r .* (.*)$')
    allhunks_re = re.compile('(?:index|deleted file) ')
    pretty_re = re.compile('(?:new file|deleted file) ')
    special_re = re.compile('(?:index|deleted|copy|rename) ')
    newfile_re = re.compile('(?:new file)')

    def __init__(self, header):
        self.header = header
        self.hunks = []

    def _anyline(self, regex):
        """Return True if any header line matches regex at its start."""
        for line in self.header:
            if regex.match(line):
                return True
        return False

    def binary(self):
        """Return True if the header carries an 'index ' line."""
        for line in self.header:
            if line.startswith('index '):
                return True
        return False

    def pretty(self, fp):
        """Write a short human-readable rendering of the header to fp.

        Lines are echoed until one of the stop conditions is met: an
        'index ' line, a new/deleted file line, or the '---' line (where a
        hunk/line count summary is written instead).
        """
        for line in self.header:
            if line.startswith('index '):
                fp.write(_('this modifies a binary file (all or nothing)\n'))
                return
            if self.pretty_re.match(line):
                fp.write(line)
                if self.binary():
                    fp.write(_('this is a binary file\n'))
                return
            if line.startswith('---'):
                changed = sum([max(hk.added, hk.removed)
                               for hk in self.hunks])
                fp.write(_('%d hunks, %d lines changed\n') %
                         (len(self.hunks), changed))
                return
            fp.write(line)

    def write(self, fp):
        """Write the raw header lines to fp."""
        fp.write(''.join(self.header))

    def allhunks(self):
        """Return True if the header has an 'index ' or 'deleted file ' line.

        filterpatch() takes all hunks of such a file together.
        """
        return self._anyline(self.allhunks_re)

    def files(self):
        """Return the file name(s) named on the first header line.

        For a 'diff --git' line this is a one- or two-element list
        (source and destination collapse when equal); otherwise it is the
        groups() tuple of the 'diff -r' pattern.
        """
        first = self.header[0]
        gitmatch = self.diffgit_re.match(first)
        if not gitmatch:
            return self.diff_re.match(first).groups()
        source, dest = gitmatch.groups()
        if source == dest:
            return [source]
        return [source, dest]

    def filename(self):
        """Return the last name reported by files()."""
        return self.files()[-1]

    def __repr__(self):
        names = [repr(f) for f in self.files()]
        return '<header %s>' % ' '.join(names)

    def isnewfile(self):
        """Return True if a header line starts with 'new file'."""
        return self._anyline(self.newfile_re)

    def special(self):
        """Return True if the file can only be taken or left as a whole.

        Special files are shown only at the header level and not at the
        hunk level: for example a deleted file is special, the user either
        takes the deletion or not. Newly added files are special only when
        they are empty (the header is exactly two lines long); a new file
        with content can still be edited hunk by hunk.
        """
        if self.isnewfile() and len(self.header) == 2:
            return True
        return self._anyline(self.special_re)
Laurent Charignon
|
r24261 | |||
Laurent Charignon
|
class recordhunk(object):
    """patch hunk

    XXX shouldn't we merge this with the other hunk class?

    A hunk is the run of changed lines (``hunk``) together with the
    context lines around it (``before`` / ``after``), the starting line
    numbers on both sides and the text following the second '@@' of the
    range line (``proc``).
    """
    # Kept for compatibility; context trimming to this size is not applied
    # (the trimming branch was already disabled in the previous code).
    maxcontext = 3

    def __init__(self, header, fromline, toline, proc, before, hunk, after):
        self.header = header
        self.fromline = fromline
        self.before = before
        self.toline = toline
        self.after = after
        self.proc = proc
        self.hunk = hunk
        self.added, self.removed = self.countchanges(self.hunk)

    def __eq__(self, v):
        if not isinstance(v, recordhunk):
            return False
        return ((v.hunk == self.hunk) and
                (v.proc == self.proc) and
                (self.fromline == v.fromline) and
                (self.header.files() == v.header.files()))

    def __ne__(self, v):
        # Python 2 does not derive != from ==; without this, two equal
        # hunks would still compare as "not equal".
        return not self == v

    def __hash__(self):
        return hash((tuple(self.hunk),
                     tuple(self.header.files()),
                     self.fromline,
                     self.proc))

    def countchanges(self, hunk):
        """hunk -> (n+,n-)"""
        add = len([h for h in hunk if h.startswith('+')])
        rem = len([h for h in hunk if h.startswith('-')])
        return add, rem

    def write(self, fp):
        """Write the hunk to fp as a unified diff hunk with a range line."""
        delta = len(self.before) + len(self.after)
        # the "no newline" marker is not a real line of either side
        if self.after and self.after[-1] == '\\ No newline at end of file\n':
            delta -= 1
        fromlen = delta + self.removed
        tolen = delta + self.added
        fp.write('@@ -%d,%d +%d,%d @@%s\n' %
                 (self.fromline, fromlen, self.toline, tolen,
                  self.proc and (' ' + self.proc)))
        fp.write(''.join(self.before + self.hunk + self.after))

    pretty = write

    def filename(self):
        return self.header.filename()

    def __repr__(self):
        return '<hunk %r@%d>' % (self.filename(), self.fromline)
Laurent Charignon
|
def filterpatch(ui, headers, operation=None):
    """Interactively filter patch chunks into applied-only chunks"""

    def edithunk(chunk):
        """Open chunk in the user's editor and return the re-parsed patch.

        The hunk is written to a temporary file followed by commented-out
        instructions; lines starting with '#' are dropped from the edited
        result before it is handed to parsepatch().
        """
        # Patch comment based on the Git one (based on comment at end of
        # http://mercurial.selenic.com/wiki/RecordExtension)
        phelp = '---' + _("""
To remove '-' lines, make them ' ' lines (context).
To remove '+' lines, delete them.
Lines starting with # will be removed from the patch.
If the patch applies cleanly, the edited hunk will immediately be
added to the record list. If it does not apply cleanly, a rejects
file will be generated: you can use that when you try again. If
all lines of the hunk are removed, then the edit is aborted and
the hunk is left unchanged.
""")
        (patchfd, patchfn) = tempfile.mkstemp(prefix="hg-editor-",
                                              suffix=".diff", text=True)
        ncpatchfp = None
        try:
            # Write the initial patch
            f = os.fdopen(patchfd, "w")
            chunk.header.write(f)
            chunk.write(f)
            f.write('\n'.join(['# ' + i for i in phelp.splitlines()]))
            f.close()
            # Start the editor and wait for it to complete
            editor = ui.geteditor()
            ui.system("%s \"%s\"" % (editor, patchfn),
                      environ={'HGUSER': ui.username()},
                      onerr=util.Abort, errprefix=_("edit failed"))
            # Remove comment lines
            patchfp = open(patchfn)
            ncpatchfp = cStringIO.StringIO()
            for line in patchfp:
                if not line.startswith('#'):
                    ncpatchfp.write(line)
            patchfp.close()
            ncpatchfp.seek(0)
            return parsepatch(ncpatchfp)
        finally:
            os.unlink(patchfn)
            del ncpatchfp

    def prompt(skipfile, skipall, query, chunk):
        """prompt query, and process base inputs

        - y/n for the rest of file
        - y/n for the rest
        - ? (help)
        - q (quit)

        Return True/False and possibly updated skipfile and skipall.
        """
        newpatches = None
        # an earlier "rest of everything" / "rest of file" answer wins
        if skipall is not None:
            return skipall, skipfile, skipall, newpatches
        if skipfile is not None:
            return skipfile, skipfile, skipall, newpatches
        while True:
            resps = _('[Ynesfdaq?]'
                      '$$ &Yes, record this change'
                      '$$ &No, skip this change'
                      '$$ &Edit this change manually'
                      '$$ &Skip remaining changes to this file'
                      '$$ Record remaining changes to this &file'
                      '$$ &Done, skip remaining changes and files'
                      '$$ Record &all changes to all remaining files'
                      '$$ &Quit, recording no changes'
                      '$$ &? (display help)')
            r = ui.promptchoice("%s %s" % (query, resps))
            ui.write("\n")
            if r == 8: # ?
                for c, t in ui.extractchoices(resps)[1]:
                    ui.write('%s - %s\n' % (c, t.lower()))
                continue
            elif r == 0: # yes
                ret = True
            elif r == 1: # no
                ret = False
            elif r == 2: # Edit patch
                if chunk is None:
                    ui.write(_('cannot edit patch for whole file'))
                    ui.write("\n")
                    continue
                if chunk.header.binary():
                    ui.write(_('cannot edit patch for binary file'))
                    ui.write("\n")
                    continue
                newpatches = edithunk(chunk)
                # Signal that the chunk shouldn't be applied as-is, but
                # provide the new patch to be used instead.
                ret = False
            elif r == 3: # Skip
                ret = skipfile = False
            elif r == 4: # file (Record remaining)
                ret = skipfile = True
            elif r == 5: # done, skip remaining
                ret = skipall = False
            elif r == 6: # all
                ret = skipall = True
            elif r == 7: # quit
                raise util.Abort(_('user quit'))
            return ret, skipfile, skipall, newpatches

    seen = set()
    applied = {}        # 'filename' -> [] of chunks
    skipfile, skipall = None, None
    pos, total = 1, sum(len(h.hunks) for h in headers)
    for h in headers:
        pos += len(h.hunks)
        skipfile = None
        # line shift to apply to later hunks when earlier ones are skipped
        fixoffset = 0
        hdr = ''.join(h.header)
        if hdr in seen:
            continue
        seen.add(hdr)
        if skipall is None:
            h.pretty(ui)
        msg = (_('examine changes to %s?') %
               _(' and ').join("'%s'" % f for f in h.files()))
        r, skipfile, skipall, np = prompt(skipfile, skipall, msg, None)
        if not r:
            continue
        applied[h.filename()] = [h]
        if h.allhunks():
            # all-or-nothing file: take every hunk without asking
            applied[h.filename()] += h.hunks
            continue
        for i, chunk in enumerate(h.hunks):
            if skipfile is None and skipall is None:
                chunk.pretty(ui)
            if total == 1:
                msg = _("record this change to '%s'?") % chunk.filename()
            else:
                idx = pos - len(h.hunks) + i
                msg = _("record change %d/%d to '%s'?") % (idx, total,
                                                           chunk.filename())
            r, skipfile, skipall, newpatches = prompt(skipfile,
                                                      skipall, msg, chunk)
            if r:
                if fixoffset:
                    chunk = copy.copy(chunk)
                    chunk.toline += fixoffset
                applied[chunk.filename()].append(chunk)
            elif newpatches is not None:
                # the user edited the hunk: record the edited version
                for newpatch in newpatches:
                    for newhunk in newpatch.hunks:
                        if fixoffset:
                            newhunk.toline += fixoffset
                        applied[newhunk.filename()].append(newhunk)
            else:
                fixoffset += chunk.removed - chunk.added
    # keep a file only if it is special or at least one hunk was selected
    return sum([h for h in applied.itervalues()
                if h[0].special() or len(h) > 1], [])
Benoit Boissinot
|
class hunk(object):
    """One hunk of a unified or context diff.

    ``hunk`` holds the hunk in unified form with the range line first,
    ``a`` the old-side lines (with their ' '/'-' prefix) and ``b`` the
    new-side lines (prefix removed); ``starta``/``lena`` and
    ``startb``/``lenb`` are the ranges announced by the hunk header.
    """
    def __init__(self, desc, num, lr, context):
        self.number = num
        self.desc = desc
        self.hunk = [desc]
        self.a = []
        self.b = []
        self.starta = self.lena = None
        self.startb = self.lenb = None
        # lr is None when an empty shell is built (see getnormalized)
        if lr is not None:
            if context:
                self.read_context_hunk(lr)
            else:
                self.read_unified_hunk(lr)

    def getnormalized(self):
        """Return a copy with line endings normalized to LF."""
        def normalize(lines):
            fixed = []
            for line in lines:
                if line.endswith('\r\n'):
                    line = line[:-2] + '\n'
                fixed.append(line)
            return fixed

        # Dummy object, it is rebuilt manually
        nh = hunk(self.desc, self.number, None, None)
        nh.hunk = self.hunk
        nh.a = normalize(self.a)
        nh.b = normalize(self.b)
        nh.starta = self.starta
        nh.startb = self.startb
        nh.lena = self.lena
        nh.lenb = self.lenb
        return nh

    def read_unified_hunk(self, lr):
        """Parse a unified hunk whose range line is self.desc from lr.

        Raises PatchError when the range line does not match.
        """
        m = unidesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        starta, lena, startb, lenb = m.groups()
        # an omitted length means a length of one
        if lena is None:
            self.lena = 1
        else:
            self.lena = int(lena)
        if lenb is None:
            self.lenb = 1
        else:
            self.lenb = int(lenb)
        self.starta = int(starta)
        self.startb = int(startb)
        diffhelpers.addlines(lr, self.hunk, self.lena, self.lenb, self.a,
                             self.b)
        # if we hit eof before finishing out the hunk, the last line will
        # be zero length. Lets try to fix it up.
        while len(self.hunk[-1]) == 0:
            del self.hunk[-1]
            del self.a[-1]
            del self.b[-1]
            self.lena -= 1
            self.lenb -= 1
        self._fixnewline(lr)

    def read_context_hunk(self, lr):
        """Parse a context-diff hunk from lr and store it in unified form.

        Raises PatchError when a range line or a body line is malformed.
        """
        self.desc = lr.readline()
        m = contextdesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.starta, aend = m.groups()
        self.starta = int(self.starta)
        if aend is None:
            aend = self.starta
        self.lena = int(aend) - self.starta
        if self.starta:
            self.lena += 1
        for x in xrange(self.lena):
            l = lr.readline()
            if l.startswith('---'):
                # lines addition, old block is empty
                lr.push(l)
                break
            # every body line carries a two-character prefix
            s = l[2:]
            if l.startswith('- ') or l.startswith('! '):
                u = '-' + s
            elif l.startswith('  '):
                u = ' ' + s
            else:
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.a.append(u)
            self.hunk.append(u)

        l = lr.readline()
        if l.startswith('\\ '):
            # "\ No newline ..." marker: drop the EOL of the last old line
            s = self.a[-1][:-1]
            self.a[-1] = s
            self.hunk[-1] = s
            l = lr.readline()
        m = contextdesc.match(l)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.startb, bend = m.groups()
        self.startb = int(self.startb)
        if bend is None:
            bend = self.startb
        self.lenb = int(bend) - self.startb
        if self.startb:
            self.lenb += 1
        # index into self.hunk where the next new-side line is merged
        hunki = 1
        for x in xrange(self.lenb):
            l = lr.readline()
            if l.startswith('\\ '):
                # XXX: the only way to hit this is with an invalid line range.
                # The no-eol marker is not counted in the line range, but I
                # guess there are diff(1) out there which behave differently.
                s = self.b[-1][:-1]
                self.b[-1] = s
                self.hunk[hunki - 1] = s
                continue
            if not l:
                # line deletions, new block is empty and we hit EOF
                lr.push(l)
                break
            s = l[2:]
            if l.startswith('+ ') or l.startswith('! '):
                u = '+' + s
            elif l.startswith('  '):
                u = ' ' + s
            elif len(self.b) == 0:
                # line deletions, new block is empty
                lr.push(l)
                break
            else:
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.b.append(s)
            # merge the line into the unified hunk: skip over removed
            # lines, stop on the identical context line or insert it
            while True:
                if hunki >= len(self.hunk):
                    h = ""
                else:
                    h = self.hunk[hunki]
                hunki += 1
                if h == u:
                    break
                elif h.startswith('-'):
                    continue
                else:
                    self.hunk.insert(hunki - 1, u)
                    break

        if not self.a:
            # this happens when lines were only added to the hunk
            for x in self.hunk:
                if x.startswith('-') or x.startswith(' '):
                    self.a.append(x)
        if not self.b:
            # this happens when lines were only deleted from the hunk
            for x in self.hunk:
                if x.startswith('+') or x.startswith(' '):
                    self.b.append(x[1:])
        # @@ -start,len +start,len @@
        self.desc = "@@ -%d,%d +%d,%d @@\n" % (self.starta, self.lena,
                                               self.startb, self.lenb)
        self.hunk[0] = self.desc
        self._fixnewline(lr)

    def _fixnewline(self, lr):
        """Consume a trailing "\\ ..." marker line from lr, if present.

        Any other line is pushed back onto lr untouched.
        """
        l = lr.readline()
        if l.startswith('\\ '):
            diffhelpers.fix_newline(self.hunk, self.a, self.b)
        else:
            lr.push(l)

    def complete(self):
        """Return True if both sides have as many lines as announced."""
        return len(self.a) == self.lena and len(self.b) == self.lenb

    def _fuzzit(self, old, new, fuzz, toponly):
        # this removes context lines from the top and bottom of list 'l'. It
        # checks the hunk to make sure only context lines are removed, and then
        # returns a new shortened list of lines.
        fuzz = min(fuzz, len(old))
        if not fuzz:
            return old, new, 0
        # the hunk starts with the @@ line, so skip element 0
        body = self.hunk[1:]
        top = 0
        for line in body:
            if line[0] != ' ':
                break
            top += 1
        bot = 0
        if not toponly:
            for line in reversed(body):
                if line[0] != ' ':
                    break
                bot += 1
        bot = min(fuzz, bot)
        top = min(fuzz, top)
        return old[top:len(old) - bot], new[top:len(new) - bot], top

    def fuzzit(self, fuzz, toponly):
        """Return (old, oldstart, new, newstart) with up to fuzz context
        lines removed; starts are converted to zero-based offsets."""
        old, new, top = self._fuzzit(self.a, self.b, fuzz, toponly)
        oldstart = self.starta + top
        newstart = self.startb + top
        # zero length hunk ranges already have their start decremented
        if self.lena and oldstart > 0:
            oldstart -= 1
        if self.lenb and newstart > 0:
            newstart -= 1
        return old, oldstart, new, newstart
Bryan O'Sullivan
|
r4897 | |||
Thomas Arendsen Hein
|
class binhunk(object):
    'A binary patch file.'
    def __init__(self, lr, fname):
        self.text = None
        self.delta = False
        self.hunk = ['GIT binary patch\n']
        self._fname = fname
        self._read(lr)

    def complete(self):
        """Return True once the payload has been decoded."""
        return self.text is not None

    def new(self, lines):
        """Return the new file content as a one-element list.

        For a 'delta' hunk the payload is applied on top of the joined
        ``lines``; for a 'literal' hunk the payload is the content.
        """
        if self.delta:
            return [applybindelta(self.text, ''.join(lines))]
        return [self.text]

    def _read(self, lr):
        """Read and decode the hunk from lr, recording raw lines in
        self.hunk.

        Raises PatchError when the 'literal'/'delta' line is missing, when
        the payload cannot be decoded or decompressed, or when the decoded
        length differs from the announced size.
        """
        def getline(lr, hunk):
            l = lr.readline()
            hunk.append(l)
            return l.rstrip('\r\n')

        size = 0
        while True:
            line = getline(lr, self.hunk)
            if not line:
                raise PatchError(_('could not extract "%s" binary data')
                                 % self._fname)
            if line.startswith('literal '):
                size = int(line[8:].rstrip())
                break
            if line.startswith('delta '):
                size = int(line[6:].rstrip())
                self.delta = True
                break
        dec = []
        line = getline(lr, self.hunk)
        while len(line) > 1:
            # the first character encodes the decoded length of the line:
            # 'A'-'Z' -> 1-26, anything else is taken relative to 'a' (27+)
            l = line[0]
            if 'A' <= l <= 'Z':
                l = ord(l) - ord('A') + 1
            else:
                l = ord(l) - ord('a') + 27
            try:
                dec.append(base85.b85decode(line[1:])[:l])
            except ValueError as e:
                raise PatchError(_('could not decode "%s" binary patch: %s')
                                 % (self._fname, str(e)))
            line = getline(lr, self.hunk)
        try:
            text = zlib.decompress(''.join(dec))
        except zlib.error as e:
            # corrupt or truncated payload: report it like any other
            # undecodable binary patch instead of leaking zlib.error
            raise PatchError(_('could not decode "%s" binary patch: %s')
                             % (self._fname, str(e)))
        if len(text) != size:
            raise PatchError(_('"%s" length is %d bytes, should be %d')
                             % (self._fname, len(text), size))
        self.text = text
Brendan Cully
|
r3367 | |||
Bryan O'Sullivan
|
def parsefilename(str):
    """Extract the file name from a '--- name' / '+++ name' style line.

    The first four characters are skipped and the line ending removed;
    the name then stops at the first tab or, when there is no tab, at
    the first space.
    """
    # --- filename \t|space stuff
    name = str[4:].rstrip('\r\n')
    for separator in ('\t', ' '):
        cut = name.find(separator)
        if cut >= 0:
            return name[:cut]
    return name
Brendan Cully
|
r2861 | |||
Laurent Charignon
|
def parsepatch(originalchunks):
    """patch -> [] of headers -> [] of hunks

    ``originalchunks`` is an iterable of strings that are joined to form
    the patch text. The text is tokenized by scanpatch() and fed to a
    small state machine that builds header objects with their
    recordhunk lists.

    Raises PatchError when an event arrives that is not allowed in the
    current state.
    """
    class parser(object):
        """patch parsing state machine"""
        def __init__(self):
            self.fromline = 0
            self.toline = 0
            self.proc = ''
            self.header = None
            self.context = []
            self.before = []
            self.hunk = []
            self.headers = []

        def addrange(self, limits):
            # only the start lines and the trailing text are needed
            fromstart, fromend, tostart, toend, proc = limits
            self.fromline = int(fromstart)
            self.toline = int(tostart)
            self.proc = proc

        def addcontext(self, context):
            if self.hunk:
                # context closes the pending run of changed lines
                h = recordhunk(self.header, self.fromline, self.toline,
                               self.proc, self.before, self.hunk, context)
                self.header.hunks.append(h)
                self.fromline += len(self.before) + h.removed
                self.toline += len(self.before) + h.added
                self.before = []
                self.hunk = []
                self.proc = ''
            self.context = context

        def addhunk(self, hunk):
            if self.context:
                self.before = self.context
                self.context = []
            self.hunk = hunk

        def newfile(self, hdr):
            # flush whatever hunk is still pending for the previous file
            self.addcontext([])
            h = header(hdr)
            self.headers.append(h)
            self.header = h

        def addother(self, line):
            pass # 'other' lines are ignored

        def finished(self):
            self.addcontext([])
            return self.headers

        # current state -> {next event -> handler}
        transitions = {
            'file': {'context': addcontext,
                     'file': newfile,
                     'hunk': addhunk,
                     'range': addrange},
            'context': {'file': newfile,
                        'hunk': addhunk,
                        'range': addrange,
                        'other': addother},
            'hunk': {'context': addcontext,
                     'file': newfile,
                     'range': addrange},
            'range': {'context': addcontext,
                      'hunk': addhunk},
            'other': {'other': addother},
            }

    p = parser()
    fp = cStringIO.StringIO()
    fp.write(''.join(originalchunks))
    fp.seek(0)

    state = 'context'
    for newstate, data in scanpatch(fp):
        # Guard only the table lookup: a KeyError raised inside a handler
        # must not be misreported as an unhandled transition.
        try:
            handler = p.transitions[state][newstate]
        except KeyError:
            raise PatchError('unhandled transition: %s -> %s' %
                             (state, newstate))
        handler(p, data)
        state = newstate
    del fp
    return p.finished()
Siddharth Agarwal
|
def pathtransform(path, strip, prefix):
    '''turn a path from a patch into a path suitable for the repository

    prefix, if not empty, is expected to be normalized with a / at the end.

    Returns (stripped components, path in repository).

    >>> pathtransform('a/b/c', 0, '')
    ('', 'a/b/c')
    >>> pathtransform(' a/b/c ', 0, '')
    ('', ' a/b/c')
    >>> pathtransform(' a/b/c ', 2, '')
    ('a/b/', 'c')
    >>> pathtransform('a/b/c', 0, 'd/e/')
    ('', 'd/e/a/b/c')
    >>> pathtransform(' a//b/c ', 2, 'd/e/')
    ('a//b/', 'd/e/c')
    >>> pathtransform('a/b/c', 3, '')
    Traceback (most recent call last):
    PatchError: unable to strip away 1 of 3 dirs from a/b/c
    '''
    if strip == 0:
        return '', prefix + path.rstrip()
    lastindex = len(path) - 1
    cut = 0
    # "remaining" counts the components still to strip, this one included
    for remaining in range(strip, 0, -1):
        cut = path.find('/', cut)
        if cut == -1:
            raise PatchError(_("unable to strip away %d of %d dirs from %s") %
                             (remaining, strip, path))
        cut += 1
        # consume '//' in the path
        while cut < lastindex and path[cut] == '/':
            cut += 1
    return path[:cut].lstrip(), prefix + path[cut:].rstrip()
Mads Kiilerich
|
r11022 | |||
Siddharth Agarwal
|
def makepatchmeta(backend, afile_orig, bfile_orig, hunk, strip, prefix):
    """Build the patchmeta for a plain (non-git) file diff.

    The target file is picked from the old/new names found in the patch
    (after pathtransform() with strip and prefix), using backend.exists()
    to see which of them is present. The operation is set to 'ADD' or
    'DELETE' when the first hunk and the names say the file is created
    or removed.

    Raises PatchError when both names are /dev/null.
    """
    nulla = afile_orig == "/dev/null"
    nullb = bfile_orig == "/dev/null"
    emptyold = hunk.starta == 0 and hunk.lena == 0
    create = nulla and emptyold
    remove = nullb and hunk.startb == 0 and hunk.lenb == 0
    abase, afile = pathtransform(afile_orig, strip, prefix)
    gooda = not nulla and backend.exists(afile)
    bbase, bfile = pathtransform(bfile_orig, strip, prefix)
    if afile == bfile:
        goodb = gooda
    else:
        goodb = not nullb and backend.exists(bfile)
    missing = not goodb and not gooda and not create

    # some diff programs apparently produce patches where the afile is
    # not /dev/null, but afile starts with bfile
    abasedir = afile[:afile.rfind('/') + 1]
    bbasedir = bfile[:bfile.rfind('/') + 1]
    if (missing and abasedir == bbasedir and afile.startswith(bfile)
        and emptyold):
        create = True
        missing = False

    # If afile is "a/b/foo" and bfile is "a/b/foo.orig" we assume the
    # diff is between a file and its backup. In this case, the original
    # file should be patched (see original mpatch code).
    isbackup = (abase == bbase and bfile.startswith(afile))
    if isbackup:
        preferred = afile
    else:
        preferred = bfile

    fname = None
    if not missing:
        if gooda and goodb:
            fname = preferred
        elif gooda:
            fname = afile

    if not fname:
        # nothing usable exists: fall back to whichever name is not null
        if not nullb:
            fname = preferred
        elif not nulla:
            fname = afile
        else:
            raise PatchError(_("undefined source and destination files"))

    gp = patchmeta(fname)
    if create:
        gp.op = 'ADD'
    elif remove:
        gp.op = 'DELETE'
    return gp
Bryan O'Sullivan
|
r4897 | |||
Laurent Charignon
|
def scanpatch(fp):
    """like patch.iterhunks, but yield different events

    - ('file',    [header_lines + fromfile + tofile])
    - ('context', [context_lines])
    - ('hunk',    [hunk_lines])
    - ('range',   (-start,len, +start,len, proc))
    - ('other',   line) for any line that fits none of the above

    In a 'range' event either len is None when the hunk header omits it
    (the unified format allows "@@ -3 +3 @@" for one-line ranges).
    """
    # the ",len" parts are optional in the unified format
    lines_re = re.compile(r'@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@\s*(.*)')
    lr = linereader(fp)

    def scanwhile(first, p):
        """scan lr while predicate holds"""
        lines = [first]
        while True:
            line = lr.readline()
            if not line:
                break
            if p(line):
                lines.append(line)
            else:
                lr.push(line)
                break
        return lines

    def notheader(line):
        # header lines run until the next '---' or 'diff' line
        s = line.split(None, 1)
        return not s or s[0] not in ('---', 'diff')

    while True:
        line = lr.readline()
        if not line:
            break
        if line.startswith('diff --git a/') or line.startswith('diff -r '):
            header = scanwhile(line, notheader)
            fromfile = lr.readline()
            if fromfile.startswith('---'):
                tofile = lr.readline()
                header += [fromfile, tofile]
            else:
                lr.push(fromfile)
            yield 'file', header
        elif line[0] == ' ':
            yield 'context', scanwhile(line, lambda l: l[0] in ' \\')
        elif line[0] in '-+':
            yield 'hunk', scanwhile(line, lambda l: l[0] in '-+\\')
        else:
            m = lines_re.match(line)
            if m:
                yield 'range', m.groups()
            else:
                yield 'other', line
Patrick Mezard
|
def scangitpatch(lr, firstline):
    """
    Git patches can emit:
    - rename a to b
    - change b
    - copy a to c
    - change c

    We cannot apply this sequence as-is, the renamed 'a' could not be
    found for it would have been renamed already. And we cannot copy
    from 'b' instead because 'b' would have been changed already. So
    we scan the git patch for copy and rename commands so we can
    perform the copies ahead of time.
    """
    startpos = 0
    try:
        startpos = lr.fp.tell()
        source = lr.fp
    except IOError:
        # tell() failed: buffer what is left so that it can be rewound
        source = cStringIO.StringIO(lr.fp.read())
    scanner = linereader(source)
    scanner.push(firstline)
    gitpatches = readgitpatch(scanner)
    # rewind so that the caller can read the same input again
    source.seek(startpos)
    return gitpatches
Patrick Mezard
|
r7152 | |||
Idan Kamara
|
def iterhunks(fp):
    """Read a patch and yield the following events:
    - ("file", afile, bfile, firsthunk): select a new target file.
    - ("hunk", hunk): a new hunk is ready to be applied, follows a
    "file" event.
    - ("git", gitchanges): current diff is in git format, gitchanges
    maps filenames to gitpatch records. Unique event.
    """
    afile = ""
    bfile = ""
    state = None
    hunknum = 0
    emitfile = newfile = False
    gitpatches = None

    # our states
    BFILE = 1
    # None: format unknown yet, True: context diff, False: unified diff
    context = None
    lr = linereader(fp)

    while True:
        line = lr.readline()
        if not line:
            break
        if state == BFILE and (
            (not context and line[0] == '@')
            or (context is not False and line.startswith('***************'))
            or line.startswith('GIT binary patch')):
            # start of a hunk for the current file
            gp = None
            if (gitpatches and
                gitpatches[-1].ispatching(afile, bfile)):
                gp = gitpatches.pop()
            if line.startswith('GIT binary patch'):
                h = binhunk(lr, gp.path)
            else:
                if context is None and line.startswith('***************'):
                    context = True
                h = hunk(line, hunknum + 1, lr, context)
            hunknum += 1
            if emitfile:
                # first hunk of the file: announce the file first
                emitfile = False
                yield 'file', (afile, bfile, h, gp and gp.copy() or None)
            yield 'hunk', h
        elif line.startswith('diff --git a/'):
            m = gitre.match(line.rstrip(' \r\n'))
            if not m:
                continue
            if gitpatches is None:
                # scan whole input for git metadata
                gitpatches = scangitpatch(lr, line)
                yield 'git', [g.copy() for g in gitpatches
                              if g.op in ('COPY', 'RENAME')]
                # reversed so that pop() hands them out in patch order
                gitpatches.reverse()
            afile = 'a/' + m.group(1)
            bfile = 'b/' + m.group(2)
            # emit the metadata-only entries that come before this file
            while gitpatches and not gitpatches[-1].ispatching(afile, bfile):
                gp = gitpatches.pop()
                yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())
            if not gitpatches:
                raise PatchError(_('failed to synchronize metadata for "%s"')
                                 % afile[2:])
            gp = gitpatches[-1]
            newfile = True
        elif line.startswith('---'):
            # check for a unified diff
            second = lr.readline()
            if not second.startswith('+++'):
                lr.push(second)
                continue
            newfile = True
            context = False
            afile = parsefilename(line)
            bfile = parsefilename(second)
        elif line.startswith('***'):
            # check for a context diff
            second = lr.readline()
            if not second.startswith('---'):
                lr.push(second)
                continue
            third = lr.readline()
            lr.push(third)
            if not third.startswith("***************"):
                lr.push(second)
                continue
            newfile = True
            context = True
            afile = parsefilename(line)
            bfile = parsefilename(second)

        if newfile:
            newfile = False
            emitfile = True
            state = BFILE
            hunknum = 0

    # git entries without any hunk left over at the end of the input
    while gitpatches:
        gp = gitpatches.pop()
        yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())
Patrick Mezard
|
r14388 | |||
Nicolas Vigier
|
def applybindelta(binchunk, data):
    """Apply a binary delta hunk
    The algorithm used is the algorithm from git's patch-delta.c

    ``binchunk`` is the decoded delta and ``data`` the content it is
    applied to; the patched content is returned as a string.

    Raises PatchError when the delta contains opcode 0.
    """
    def deltahead(chunk):
        # length of the leading variable-length number: it ends with the
        # first byte whose high bit is clear
        for pos, char in enumerate(chunk):
            if not (ord(char) & 0x80):
                return pos + 1
        return len(chunk)

    # (flag bit in the opcode, shift of the byte it announces)
    offsetbytes = ((0x01, 0), (0x02, 8), (0x04, 16), (0x08, 24))
    sizebytes = ((0x10, 0), (0x20, 8), (0x40, 16))

    # skip the two size headers in front of the opcodes
    binchunk = binchunk[deltahead(binchunk):]
    binchunk = binchunk[deltahead(binchunk):]

    # collect the pieces and join once instead of growing a string
    pieces = []
    i = 0
    end = len(binchunk)
    while i < end:
        cmd = ord(binchunk[i])
        i += 1
        if cmd & 0x80:
            # copy from data: offset and size bytes are present only when
            # their flag bit is set in the opcode
            offset = 0
            for flag, shift in offsetbytes:
                if cmd & flag:
                    offset |= ord(binchunk[i]) << shift
                    i += 1
            size = 0
            for flag, shift in sizebytes:
                if cmd & flag:
                    size |= ord(binchunk[i]) << shift
                    i += 1
            if size == 0:
                size = 0x10000
            pieces.append(data[offset:offset + size])
        elif cmd != 0:
            # insert the next cmd bytes of the delta itself
            pieces.append(binchunk[i:i + cmd])
            i += cmd
        else:
            raise PatchError(_('unexpected delta opcode 0'))
    return ''.join(pieces)
Siddharth Agarwal
|
def applydiff(ui, fp, backend, store, strip=1, prefix='', eolmode='strict'):
    """Reads a patch from fp and tries to apply it.

    Returns 0 for a clean patch, -1 if any rejects were found and 1 if
    there was any fuzz.

    If 'eolmode' is 'strict', the patch content and patched file are
    read in binary mode. Otherwise, line endings are ignored when
    patching then normalized according to 'eolmode'.
    """
    # Delegate to the generic driver, using patchfile as the per-file patcher
    options = {'strip': strip, 'prefix': prefix, 'eolmode': eolmode}
    return _applydiff(ui, fp, patchfile, backend, store, **options)
Augie Fackler
|
r10966 | |||
Siddharth Agarwal
|
def _applydiff(ui, fp, patcher, backend, store, strip=1, prefix='',
               eolmode='strict'):
    """Drive the application of the patch read from fp.

    Consumes the (state, values) events produced by iterhunks(fp):

    - 'file' starts a new target file; patcher(ui, gp, backend, store,
      eolmode=eolmode) is called to build the object hunks are applied to,
      unless the entry carries no hunk, in which case it is handled
      directly through backend
    - 'hunk' is applied to the current file object, if there is one
    - 'git' saves the content of copy/rename sources into store

    Returns -1 if any rejects were counted, otherwise 1 if some hunk
    application returned a positive value, otherwise 0.

    Raises util.Abort on an unknown parser state and PatchError when a
    hunk-less add/rename/copy targets an existing path.
    """

    if prefix:
        prefix = pathutil.canonpath(backend.repo.root, backend.repo.getcwd(),
                                    prefix)
        if prefix != '':
            prefix += '/'
    def pstrip(p):
        # strip leading path components, then prepend the prefix
        return pathtransform(p, strip - 1, prefix)[1]

    rejects = 0
    err = 0
    current_file = None

    for state, values in iterhunks(fp):
        if state == 'hunk':
            # Hunks for a file that could not be set up are dropped
            if not current_file:
                continue
            ret = current_file.apply(values)
            if ret > 0:
                err = 1
        elif state == 'file':
            # Finish the previous file before starting the next one
            if current_file:
                rejects += current_file.close()
                current_file = None
            afile, bfile, first_hunk, gp = values
            if gp:
                gp.path = pstrip(gp.path)
                if gp.oldpath:
                    gp.oldpath = pstrip(gp.oldpath)
            else:
                gp = makepatchmeta(backend, afile, bfile, first_hunk, strip,
                                   prefix)
            if gp.op == 'RENAME':
                backend.unlink(gp.oldpath)
            if not first_hunk:
                # No hunk follows: the whole change is described by gp
                if gp.op == 'DELETE':
                    backend.unlink(gp.path)
                    continue
                data, mode = None, None
                if gp.op in ('RENAME', 'COPY'):
                    data, mode = store.getfile(gp.oldpath)[:2]
                    # FIXME: failing getfile has never been handled here
                    assert data is not None
                if gp.mode:
                    mode = gp.mode
                    if gp.op == 'ADD':
                        # Added files without content have no hunk and
                        # must be created
                        data = ''
                if data or mode:
                    if (gp.op in ('ADD', 'RENAME', 'COPY')
                        and backend.exists(gp.path)):
                        raise PatchError(_("cannot create %s: destination "
                                           "already exists") % gp.path)
                    backend.setfile(gp.path, data, mode, gp.oldpath)
                continue
            try:
                current_file = patcher(ui, gp, backend, store,
                                       eolmode=eolmode)
            except PatchError, inst:
                # Count the file as rejected and keep going; its hunks
                # are skipped because current_file stays None
                ui.warn(str(inst) + '\n')
                current_file = None
                rejects += 1
                continue
        elif state == 'git':
            for gp in values:
                path = pstrip(gp.oldpath)
                data, mode = backend.getfile(path)
                if data is None:
                    # The error ignored here will trigger a getfile()
                    # error in a place more appropriate for error
                    # handling, and will not interrupt the patching
                    # process.
                    pass
                else:
                    store.setfile(path, data, mode)
        else:
            raise util.Abort(_('unsupported parser state: %s') % state)

    # Finish the last file
    if current_file:
        rejects += current_file.close()

    if rejects:
        return -1
    return err
Vadim Gelfer
|
r2874 | |||
Patrick Mezard
|
def _externalpatch(ui, repo, patcher, patchname, strip, files,
                   similarity):
    """use <patcher> to apply <patchname> to the working directory.
    returns whether patch was applied with fuzz factor.

    The patcher output is scanned line by line: every file announced by a
    'patching file' line is added to files, and fuzz, reject and failure
    messages are forwarded to ui.warn(). Once the output is exhausted (or
    scanning failed), scmutil.marktouched() is called if files is not
    empty.

    Raises PatchError if closing the pipe reports a non-zero exit code."""

    fuzz = False
    args = []
    cwd = repo.root
    if cwd:
        args.append('-d %s' % util.shellquote(cwd))
    fp = util.popen('%s %s -p%d < %s' % (patcher, ' '.join(args), strip,
                                       util.shellquote(patchname)))
    # Until a 'patching file' line has been seen there is no file name to
    # report. Starting with printed_file set keeps a fuzz or FAILED message
    # that arrives first from touching the still unknown pf, which used to
    # fail on an unbound local variable.
    pf = None
    printed_file = True
    try:
        for line in fp:
            line = line.rstrip()
            ui.note(line + '\n')
            if line.startswith('patching file '):
                pf = util.parsepatchoutput(line)
                printed_file = False
                files.add(pf)
            elif line.find('with fuzz') >= 0:
                fuzz = True
                if not printed_file:
                    # name the file once, before its first warning
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
            elif line.find('saving rejects to file') >= 0:
                ui.warn(line + '\n')
            elif line.find('FAILED') >= 0:
                if not printed_file:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
    finally:
        if files:
            scmutil.marktouched(repo, files, similarity)
    code = fp.close()
    if code:
        raise PatchError(_("patch command failed: %s") %
                         util.explainexit(code)[0])
    return fuzz
Siddharth Agarwal
|
def patchbackend(ui, backend, patchobj, strip, prefix, files=None,
                 eolmode='strict'):
    """apply <patchobj> through <backend>.

    patchobj is first handed to open(); if that raises TypeError it is
    used as the patch stream itself. The paths returned by backend.close()
    are added to files. If eolmode is None it is read from the patch.eol
    configuration, defaulting to 'strict'.

    Returns whether the patch was applied with fuzz. Raises util.Abort on
    an unsupported eolmode and PatchError if the patch failed to apply."""
    if files is None:
        files = set()

    if eolmode is None:
        eolmode = ui.config('patch', 'eol', 'strict')
    normalized = eolmode.lower()
    if normalized not in eolmodes:
        # report the value as it was given, not the lowercased form
        raise util.Abort(_('unsupported line endings type: %s') % eolmode)
    eolmode = normalized

    store = filestore()
    try:
        fp = open(patchobj, 'rb')
    except TypeError:
        fp = patchobj
    try:
        status = applydiff(ui, fp, backend, store, strip=strip, prefix=prefix,
                           eolmode=eolmode)
    finally:
        # only close the stream if it was opened here
        if fp != patchobj:
            fp.close()
        files.update(backend.close())
        store.close()

    if status < 0:
        raise PatchError(_('patch failed to apply'))
    return status > 0
Siddharth Agarwal
|
def internalpatch(ui, repo, patchobj, strip, prefix='', files=None,
                  eolmode='strict', similarity=0):
    """use builtin patch to apply <patchobj> to the working directory.
    returns whether patch was applied with fuzz factor."""
    # similarity is only consumed by the working directory backend
    wdbackend = workingbackend(ui, repo, similarity)
    fuzzed = patchbackend(ui, wdbackend, patchobj, strip, prefix, files,
                          eolmode)
    return fuzzed
Patrick Mezard
|
r14611 | |||
Siddharth Agarwal
|
def patchrepo(ui, repo, ctx, store, patchobj, strip, prefix, files=None,
              eolmode='strict'):
    """apply <patchobj> through a repobackend built from ui, repo, ctx
    and store. returns the result of patchbackend()."""
    target = repobackend(ui, repo, ctx, store)
    fuzzed = patchbackend(ui, target, patchobj, strip, prefix, files,
                          eolmode)
    return fuzzed
Patrick Mezard
|
r14611 | |||
Siddharth Agarwal
|
def patch(ui, repo, patchname, strip=1, prefix='', files=None, eolmode='strict',
          similarity=0):
    """Apply <patchname> to the working directory.

    'eolmode' specifies how end of lines should be handled. It can be:
    - 'strict': inputs are read in binary mode, EOLs are preserved
    - 'crlf': EOLs are ignored when patching and reset to CRLF
    - 'lf': EOLs are ignored when patching and reset to LF
    - None: get it from user settings, default to 'strict'
    'eolmode' is ignored when using an external patcher program.

    Returns whether patch was applied with fuzz factor.
    """
    externaltool = ui.config('ui', 'patch')
    if files is None:
        files = set()
    if not externaltool:
        # no ui.patch configured: use the builtin implementation
        return internalpatch(ui, repo, patchname, strip, prefix, files,
                             eolmode, similarity)
    return _externalpatch(ui, repo, externaltool, patchname, strip,
                          files, similarity)
Patrick Mezard
|
r7151 | |||
Patrick Mezard
|
def changedfiles(ui, repo, patchpath, strip=1):
    """return the set of paths named by the patch stored at patchpath.

    For every 'file' event of the parsed patch the target path is
    collected, plus the old path when the operation is a rename. Raises
    util.Abort on an unknown parser state."""
    backend = fsbackend(ui, repo.root)
    touched = set()
    fp = open(patchpath, 'rb')
    try:
        for state, values in iterhunks(fp):
            if state in ('hunk', 'git'):
                # these events carry no path information needed here
                continue
            if state != 'file':
                raise util.Abort(_('unsupported parser state: %s') % state)
            afile, bfile, first_hunk, gp = values
            if not gp:
                gp = makepatchmeta(backend, afile, bfile, first_hunk, strip,
                                   '')
            else:
                gp.path = pathtransform(gp.path, strip - 1, '')[1]
                if gp.oldpath:
                    gp.oldpath = pathtransform(gp.oldpath, strip - 1, '')[1]
            touched.add(gp.path)
            if gp.op == 'RENAME':
                touched.add(gp.oldpath)
        return touched
    finally:
        fp.close()
Patrick Mezard
|
class GitDiffRequired(Exception):
    """raised while generating a diff to request the git patch format"""
Dirkjan Ochtman
|
r7198 | |||
Siddharth Agarwal
|
def diffallopts(ui, opts=None, untrusted=False, section='diff'):
    '''return diffopts with all features supported and parsed'''
    # opt in to every feature group difffeatureopts knows about
    features = {'git': True, 'whitespace': True, 'formatchanging': True}
    return difffeatureopts(ui, opts=opts, untrusted=untrusted,
                           section=section, **features)

# diffopts is kept as an alias of diffallopts
diffopts = diffallopts
Siddharth Agarwal
|
def difffeatureopts(ui, opts=None, untrusted=False, section='diff', git=False,
                    whitespace=False, formatchanging=False):
    '''return diffopts with only opted-in features parsed

    Features:
    - git: git-style diffs
    - whitespace: whitespace options like ignoreblanklines and ignorews
    - formatchanging: options that will likely break or cause correctness issues
      with most diff parsers
    '''
    def get(key, name=None, getter=ui.configbool, forceplain=None):
        # A truthy value passed in opts wins over the configuration
        override = opts and opts.get(key)
        if override:
            return override
        if forceplain is not None and ui.plain():
            return forceplain
        return getter(section, name or key, None, untrusted=untrusted)

    buildopts = {}

    # core options, expected to be understood by every diff parser
    buildopts['nodates'] = get('nodates')
    buildopts['showfunc'] = get('show_function', 'showfunc')
    buildopts['context'] = get('unified', getter=ui.config)

    if git:
        buildopts['git'] = get('git')

    if whitespace:
        for key, name in (('ignore_all_space', 'ignorews'),
                          ('ignore_space_change', 'ignorewsamount'),
                          ('ignore_blank_lines', 'ignoreblanklines')):
            buildopts[name] = get(key, name)

    if formatchanging:
        # 'text' is only ever taken from opts, never from the configuration
        buildopts['text'] = opts and opts.get('text')
        buildopts['nobinary'] = get('nobinary')
        buildopts['noprefix'] = get('noprefix', forceplain=False)

    return mdiff.diffopts(**buildopts)
Benoit Boissinot
|
r10615 | |||
Patrick Mezard
|
def diff(repo, node1=None, node2=None, match=None, changes=None, opts=None,
         losedatafn=None, prefix='', relroot=''):
    '''yields diff of changes to files between two nodes, or node and
    working directory.

    if node1 is None, use first dirstate parent instead.
    if node2 is None, compare node1 with working directory.

    changes, if given, is used instead of computing the status between
    the two contexts; its first three items must be the modified, added
    and removed file lists.

    losedatafn(**kwarg) is a callable run when opts.upgrade=True and
    every time some change cannot be represented with the current
    patch format. Return False to upgrade to git patch format, True to
    accept the loss or raise an exception to abort the diff. It is
    called with the name of current file being diffed as 'fn'. If set
    to None, patches will always be upgraded to git format when
    necessary.

    prefix is a filename prefix that is prepended to all filenames on
    display (used for subrepos).

    relroot, if not empty, must be normalized with a trailing /. Any match
    patterns that fall outside it will be ignored.'''

    if opts is None:
        opts = mdiff.defaultopts

    if not node1 and not node2:
        node1 = repo.dirstate.p1()

    def lrugetfilectx():
        # Small LRU cache of filelogs, keyed by file name; order records
        # the names from least to most recently used.
        cache = {}
        order = collections.deque()
        def getfilectx(f, ctx):
            fctx = ctx.filectx(f, filelog=cache.get(f))
            if f not in cache:
                if len(cache) > 20:
                    del cache[order.popleft()]
                cache[f] = fctx.filelog()
            else:
                order.remove(f)
            order.append(f)
            return fctx
        return getfilectx
    getfilectx = lrugetfilectx()

    ctx1 = repo[node1]
    ctx2 = repo[node2]

    relfiltered = False
    # match defaults to None; treat that like a matcher that matches
    # everything instead of failing on match.always().
    if relroot != '' and (match is None or match.always()):
        # as a special case, create a new matcher with just the relroot
        pats = [relroot]
        match = scmutil.match(ctx2, pats, default='path')
        # Only a status computed below with this matcher is known to be
        # restricted to relroot; lists supplied by the caller through
        # changes still have to go through filterrel.
        relfiltered = not changes

    if not changes:
        changes = repo.status(ctx1, ctx2, match=match)
    modified, added, removed = changes[:3]

    if not modified and not added and not removed:
        return []

    if repo.ui.debugflag:
        hexfunc = hex
    else:
        hexfunc = short
    revs = [hexfunc(node) for node in [ctx1.node(), ctx2.node()] if node]

    copy = {}
    if opts.git or opts.upgrade:
        copy = copies.pathcopies(ctx1, ctx2, match=match)

    if relroot is not None:
        if not relfiltered:
            # XXX this would ideally be done in the matcher, but that is
            # generally meant to 'or' patterns, not 'and' them. In this case we
            # need to 'and' all the patterns from the matcher with relroot.
            def filterrel(l):
                return [f for f in l if f.startswith(relroot)]
            modified = filterrel(modified)
            added = filterrel(added)
            removed = filterrel(removed)
            relfiltered = True
        # filter out copies where either side isn't inside the relative root
        copy = dict(((dst, src) for (dst, src) in copy.iteritems()
                     if dst.startswith(relroot)
                     and src.startswith(relroot)))

    def difffn(opts, losedata):
        return trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
                       copy, getfilectx, opts, losedata, prefix, relroot)
    if opts.upgrade and not opts.git:
        try:
            def losedata(fn):
                if not losedatafn or not losedatafn(fn=fn):
                    raise GitDiffRequired
            # Buffer the whole output until we are sure it can be generated
            return list(difffn(opts.copy(git=False), losedata))
        except GitDiffRequired:
            return difffn(opts.copy(git=True), None)
    else:
        return difffn(opts, None)
Brodie Rao
|
def difflabel(func, *args, **kw):
    '''yields 2-tuples of (output, label) based on the output of func()

    func(*args, **kw) must yield chunks of diff text. Each line is
    labelled according to its prefix; on changed lines, runs of tabs and
    trailing whitespace get their own labels.'''
    headerlabels = [('diff', 'diff.diffline'),
                    ('copy', 'diff.extended'),
                    ('rename', 'diff.extended'),
                    ('old', 'diff.extended'),
                    ('new', 'diff.extended'),
                    ('deleted', 'diff.extended'),
                    ('---', 'diff.file_a'),
                    ('+++', 'diff.file_b')]
    bodylabels = [('@', 'diff.hunk'),
                  ('-', 'diff.deleted'),
                  ('+', 'diff.inserted')]
    inheader = False
    for chunk in func(*args, **kw):
        for lineno, line in enumerate(chunk.split('\n')):
            if lineno:
                # give back the newline removed by split()
                yield ('\n', '')

            # A header starts on any non-empty line that cannot belong to
            # a hunk and lasts until the next line starting with '@'.
            if inheader:
                if line.startswith('@'):
                    inheader = False
            elif line and line[0] not in ' +-@\\':
                inheader = True

            # highlight tabs and trailing whitespace, but only in
            # changed lines
            changed = bool(not inheader and line and line[0] in '+-')
            if changed:
                body = line.rstrip()
            else:
                body = line

            if inheader:
                candidates = headerlabels
            else:
                candidates = bodylabels

            for prefix, label in candidates:
                if not body.startswith(prefix):
                    continue
                if changed:
                    for token in tabsplitter.findall(body):
                        if token[0] == '\t':
                            yield (token, 'diff.tab')
                        else:
                            yield (token, label)
                else:
                    yield (body, label)
                break
            else:
                # no known prefix: emit the line unlabelled
                yield (line, '')
            if line != body:
                yield (line[len(body):], 'diff.trailingwhitespace')
def diffui(*args, **kw):
    '''like diff(), but yields 2-tuples of (output, label) for ui.write()

    All arguments are passed through to diff() unchanged.'''
    labelled = difflabel(diff, *args, **kw)
    return labelled
Martin von Zweigbergk
|
r24106 | def _filepairs(ctx1, modified, added, removed, copy, opts): | ||
'''generates tuples (f1, f2, copyop), where f1 is the name of the file | ||||
before and f2 is the the name after. For added files, f1 will be None, | ||||
and for removed files, f2 will be None. copyop may be set to None, 'copy' | ||||
or 'rename' (the latter two only if opts.git is set).''' | ||||
gone = set() | ||||
copyto = dict([(v, k) for k, v in copy.items()]) | ||||
addedset, removedset = set(added), set(removed) | ||||
# Fix up added, since merged-in additions appear as | ||||
# modifications during merges | ||||
for f in modified: | ||||
if f not in ctx1: | ||||
addedset.add(f) | ||||
for f in sorted(modified + added + removed): | ||||
copyop = None | ||||
f1, f2 = f, f | ||||
if f in addedset: | ||||
f1 = None | ||||
if f in copy: | ||||
if opts.git: | ||||
f1 = copy[f] | ||||
if f1 in removedset and f1 not in gone: | ||||
copyop = 'rename' | ||||
gone.add(f1) | ||||
else: | ||||
copyop = 'copy' | ||||
elif f in removedset: | ||||
f2 = None | ||||
if opts.git: | ||||
# have we already reported a copy above? | ||||
if (f in copyto and copyto[f] in addedset | ||||
and copy[copyto[f]] == f): | ||||
continue | ||||
yield f1, f2, copyop | ||||
Patrick Mezard
|
def trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
            copy, getfilectx, opts, losedatafn, prefix, relroot):
    '''given input data, generate a diff and yield it in blocks

    If generating a diff would lose data like flags or binary data and
    losedatafn is not None, it will be called.

    relroot is removed and prefix is added to every path in the diff output.

    If relroot is not empty, this function expects every path in modified,
    added, removed and copy to start with it.

    For each file pair, the header lines (if any) are yielded as one
    block, followed by the diff text as another block.'''

    def gitindex(text):
        # hex digest of 'blob <length>\0' followed by the content
        if not text:
            text = ""
        l = len(text)
        s = util.sha1('blob %d\0' % l)
        s.update(text)
        return s.hexdigest()

    if opts.noprefix:
        aprefix = bprefix = ''
    else:
        aprefix = 'a/'
        bprefix = 'b/'

    def diffline(f, revs):
        # header line used when the git format is not in use
        revinfo = ' '.join(["-r %s" % rev for rev in revs])
        return 'diff %s %s' % (revinfo, f)

    date1 = util.datestr(ctx1.date())
    date2 = util.datestr(ctx2.date())

    # file flag -> mode string printed in git headers
    gitmode = {'l': '120000', 'x': '100755', '': '100644'}

    # Optional sanity check, enabled through the devel configuration
    if relroot != '' and (repo.ui.configbool('devel', 'all')
                          or repo.ui.configbool('devel', 'check-relroot')):
        for f in modified + added + removed + copy.keys() + copy.values():
            if f is not None and not f.startswith(relroot):
                raise AssertionError(
                    "file %s doesn't start with relroot %s" % (f, relroot))

    for f1, f2, copyop in _filepairs(
            ctx1, modified, added, removed, copy, opts):
        content1 = None
        content2 = None
        flag1 = None
        flag2 = None
        if f1:
            content1 = getfilectx(f1, ctx1).data()
            if opts.git or losedatafn:
                flag1 = ctx1.flags(f1)
        if f2:
            content2 = getfilectx(f2, ctx2).data()
            if opts.git or losedatafn:
                flag2 = ctx2.flags(f2)
        # Flags and binary status are only looked up when they can matter
        binary = False
        if opts.git or losedatafn:
            binary = util.binary(content1) or util.binary(content2)

        if losedatafn and not opts.git:
            if (binary or
                # copy/rename
                f2 in copy or
                # empty file creation
                (not f1 and not content2) or
                # empty file deletion
                (not content1 and not f2) or
                # create with flags
                (not f1 and flag2) or
                # change flags
                (f1 and f2 and flag1 != flag2)):
                losedatafn(f2 or f1)

        # An added or removed file uses its only name on both sides
        path1 = f1 or f2
        path2 = f2 or f1
        path1 = posixpath.join(prefix, path1[len(relroot):])
        path2 = posixpath.join(prefix, path2[len(relroot):])
        header = []
        if opts.git:
            header.append('diff --git %s%s %s%s' %
                          (aprefix, path1, bprefix, path2))
            if not f1: # added
                header.append('new file mode %s' % gitmode[flag2])
            elif not f2: # removed
                header.append('deleted file mode %s' % gitmode[flag1])
            else:  # modified/copied/renamed
                mode1, mode2 = gitmode[flag1], gitmode[flag2]
                if mode1 != mode2:
                    header.append('old mode %s' % mode1)
                    header.append('new mode %s' % mode2)
                if copyop is not None:
                    header.append('%s from %s' % (copyop, path1))
                    header.append('%s to %s' % (copyop, path2))
        elif revs and not repo.ui.quiet:
            header.append(diffline(path1, revs))

        if binary and opts.git and not opts.nobinary:
            text = mdiff.b85diff(content1, content2)
            if text:
                header.append('index %s..%s' %
                              (gitindex(content1), gitindex(content2)))
        else:
            text = mdiff.unidiff(content1, date1,
                                 content2, date2,
                                 path1, path2, opts=opts)
        # A header consisting of the 'diff' line alone is only emitted
        # when there is diff text to go with it
        if header and (text or len(header) > 1):
            yield '\n'.join(header) + '\n'
        if text:
            yield text
Vadim Gelfer
|
r2874 | |||
Matt Mackall
|
def diffstatsum(stats):
    '''summarize the (filename, adds, removes, isbinary) tuples in stats

    Returns a tuple (maxfile, maxtotal, addtotal, removetotal, binary):
    the widest file name as measured by encoding.colwidth(), the largest
    adds + removes of a single file, the sums of adds and of removes, and
    whether any entry is flagged binary.'''
    maxfile = 0
    maxtotal = 0
    addtotal = 0
    removetotal = 0
    binary = False
    for name, adds, removes, isbinary in stats:
        namewidth = encoding.colwidth(name)
        if namewidth > maxfile:
            maxfile = namewidth
        changed = adds + removes
        if changed > maxtotal:
            maxtotal = changed
        addtotal += adds
        removetotal += removes
        if not binary:
            binary = isbinary
    return maxfile, maxtotal, addtotal, removetotal, binary
Matt Mackall
|
r14401 | |||
Alexander Solovyov
|
def diffstatdata(lines):
    '''parse diff output and return per-file statistics

    lines is an iterable of diff lines. Returns a list of
    (filename, adds, removes, isbinary) tuples, one for each 'diff' line
    from which a file name could be extracted.'''
    diffre = re.compile(r'^diff .*-r [a-z0-9]+\s(.*)$')

    results = []
    filename, adds, removes, isbinary = None, 0, 0, False

    def addresult():
        if filename:
            results.append((filename, adds, removes, isbinary))

    # inheader tracks whether the current line belongs to the header part
    # of a file diff, i.e. sits between its 'diff' line and its first '@@'
    # line. Header lines starting with '---' or '+++' must not be counted,
    # while hunk lines whose content starts with '-- ' or '++ ' must be.
    inheader = False

    for line in lines:
        if line.startswith('diff'):
            addresult()
            # starting a new file diff: reset the counters
            inheader = True
            adds, removes, isbinary = 0, 0, False
            if line.startswith('diff --git a/'):
                filename = gitre.search(line).group(2)
            elif line.startswith('diff -r'):
                # format: "diff -r ... -r ... filename"
                filename = diffre.search(line).group(1)
        elif line.startswith('@@'):
            inheader = False
        elif line.startswith('+') and not inheader:
            adds += 1
        elif line.startswith('-') and not inheader:
            removes += 1
        elif (line.startswith('GIT binary patch') or
              line.startswith('Binary file')):
            isbinary = True
    addresult()
    return results
Alexander Solovyov
|
r7547 | |||
Brodie Rao
|
def diffstat(lines, width=80, git=False):
    '''return a diffstat summary of the diff in lines as a single string

    One row is produced per file, followed by a totals row when at least
    one file was found. width is the target width of a row; the graph
    column never gets narrower than 10 characters.'''
    stats = diffstatdata(lines)
    maxname, maxtotal, totaladds, totalremoves, hasbinary = diffstatsum(stats)

    countwidth = len(str(maxtotal))
    if hasbinary:
        # leave room for 'Bin'
        countwidth = max(countwidth, 3)
    graphwidth = max(width - countwidth - maxname - 6, 10)

    def scale(i):
        if maxtotal <= graphwidth:
            return i
        # If diffstat runs out of room it doesn't print anything,
        # which isn't very useful, so always print at least one + or -
        # if there were at least some changes.
        return max(i * graphwidth // maxtotal, int(bool(i)))

    rows = []
    for filename, adds, removes, isbinary in stats:
        count = adds + removes
        if isbinary:
            count = 'Bin'
        padding = ' ' * (maxname - encoding.colwidth(filename))
        graph = '+' * scale(adds) + '-' * scale(removes)
        rows.append(' %s%s | %*s %s%s\n' %
                    (filename, padding, countwidth, count, graph, ''))

    if stats:
        rows.append(_(' %d files changed, %d insertions(+), '
                      '%d deletions(-)\n')
                    % (len(stats), totaladds, totalremoves))

    return ''.join(rows)
Brodie Rao
|
r10818 | |||
def diffstatui(*args, **kw):
    '''like diffstat(), but yields 2-tuples of (output, label) for
    ui.write()
    '''
    graphparts = ((r'\++', 'diffstat.inserted'),
                  (r'-+', 'diffstat.deleted'))
    for line in diffstat(*args, **kw).splitlines():
        hasgraph = bool(line) and line[-1] in '+-'
        if not hasgraph:
            yield (line, '')
        else:
            # the graph is whatever follows the last space
            name, graph = line.rsplit(' ', 1)
            yield (name + ' ', '')
            for pattern, label in graphparts:
                found = re.search(pattern, graph)
                if found:
                    yield (found.group(0), label)
        yield ('\n', '')