patch.py
1868 lines
| 62.8 KiB
| text/x-python
|
PythonLexer
/ mercurial / patch.py
Brendan Cully
|
r2861 | # patch.py - patch file parsing routines | ||
# | ||||
Vadim Gelfer
|
r2865 | # Copyright 2006 Brendan Cully <brendan@kublai.com> | ||
Bryan O'Sullivan
|
r4897 | # Copyright 2007 Chris Mason <chris.mason@oracle.com> | ||
Vadim Gelfer
|
r2865 | # | ||
Martin Geisler
|
r8225 | # This software may be used and distributed according to the terms of the | ||
Matt Mackall
|
r10263 | # GNU General Public License version 2 or any later version. | ||
Brendan Cully
|
r2861 | |||
Adrian Buehlmann
|
r13112 | import cStringIO, email.Parser, os, errno, re | ||
Patrick Mezard
|
r14452 | import tempfile, zlib, shutil | ||
Augie Fackler
|
r10965 | |||
Matt Mackall
|
r3891 | from i18n import _ | ||
Joel Rosdahl
|
r6211 | from node import hex, nullid, short | ||
Patrick Mezard
|
r14611 | import base85, mdiff, scmutil, util, diffhelpers, copies, encoding, error | ||
import context | ||||
Vadim Gelfer
|
r2866 | |||
Dirkjan Ochtman
|
r7199 | gitre = re.compile('diff --git a/(.*) b/(.*)') | ||
Bryan O'Sullivan
|
r4897 | class PatchError(Exception): | ||
pass | ||||
Brendan Cully
|
r2933 | |||
# public functions | ||||
Brendan Cully
|
r10384 | def split(stream): | ||
'''return an iterator of individual patches from a stream''' | ||||
def isheader(line, inheader): | ||||
if inheader and line[0] in (' ', '\t'): | ||||
# continuation | ||||
return True | ||||
Peter Arrenbrecht
|
r10883 | if line[0] in (' ', '-', '+'): | ||
# diff line - don't check for header pattern in there | ||||
return False | ||||
Brendan Cully
|
r10384 | l = line.split(': ', 1) | ||
return len(l) == 2 and ' ' not in l[0] | ||||
def chunk(lines): | ||||
return cStringIO.StringIO(''.join(lines)) | ||||
def hgsplit(stream, cur): | ||||
inheader = True | ||||
for line in stream: | ||||
if not line.strip(): | ||||
inheader = False | ||||
if not inheader and line.startswith('# HG changeset patch'): | ||||
yield chunk(cur) | ||||
cur = [] | ||||
inheader = True | ||||
cur.append(line) | ||||
if cur: | ||||
yield chunk(cur) | ||||
def mboxsplit(stream, cur): | ||||
for line in stream: | ||||
if line.startswith('From '): | ||||
for c in split(chunk(cur[1:])): | ||||
yield c | ||||
cur = [] | ||||
cur.append(line) | ||||
if cur: | ||||
for c in split(chunk(cur[1:])): | ||||
yield c | ||||
def mimesplit(stream, cur): | ||||
def msgfp(m): | ||||
fp = cStringIO.StringIO() | ||||
g = email.Generator.Generator(fp, mangle_from_=False) | ||||
g.flatten(m) | ||||
fp.seek(0) | ||||
return fp | ||||
for line in stream: | ||||
cur.append(line) | ||||
c = chunk(cur) | ||||
m = email.Parser.Parser().parse(c) | ||||
if not m.is_multipart(): | ||||
yield msgfp(m) | ||||
else: | ||||
ok_types = ('text/plain', 'text/x-diff', 'text/x-patch') | ||||
for part in m.walk(): | ||||
ct = part.get_content_type() | ||||
if ct not in ok_types: | ||||
continue | ||||
yield msgfp(part) | ||||
def headersplit(stream, cur): | ||||
inheader = False | ||||
for line in stream: | ||||
if not inheader and isheader(line, inheader): | ||||
yield chunk(cur) | ||||
cur = [] | ||||
inheader = True | ||||
if inheader and not isheader(line, inheader): | ||||
inheader = False | ||||
cur.append(line) | ||||
if cur: | ||||
yield chunk(cur) | ||||
def remainder(cur): | ||||
yield chunk(cur) | ||||
class fiter(object): | ||||
def __init__(self, fp): | ||||
self.fp = fp | ||||
def __iter__(self): | ||||
return self | ||||
def next(self): | ||||
l = self.fp.readline() | ||||
if not l: | ||||
raise StopIteration | ||||
return l | ||||
inheader = False | ||||
cur = [] | ||||
mimeheaders = ['content-type'] | ||||
Augie Fackler
|
r14966 | if not util.safehasattr(stream, 'next'): | ||
Brendan Cully
|
r10384 | # http responses, for example, have readline but not next | ||
stream = fiter(stream) | ||||
for line in stream: | ||||
cur.append(line) | ||||
if line.startswith('# HG changeset patch'): | ||||
return hgsplit(stream, cur) | ||||
elif line.startswith('From '): | ||||
return mboxsplit(stream, cur) | ||||
elif isheader(line, inheader): | ||||
inheader = True | ||||
if line.split(':', 1)[0].lower() in mimeheaders: | ||||
# let email parser handle this | ||||
return mimesplit(stream, cur) | ||||
Brendan Cully
|
r10501 | elif line.startswith('--- ') and inheader: | ||
# No evil headers seen by diff start, split by hand | ||||
Brendan Cully
|
r10384 | return headersplit(stream, cur) | ||
# Not enough info, keep reading | ||||
# if we are here, we have a very plain patch | ||||
return remainder(cur) | ||||
Vadim Gelfer
|
r2866 | def extract(ui, fileobj): | ||
'''extract patch from data read from fileobj. | ||||
Brendan Cully
|
r4263 | patch can be a normal patch or contained in an email message. | ||
Vadim Gelfer
|
r2866 | |||
Dan Drake
|
r11645 | return tuple (filename, message, user, date, branch, node, p1, p2). | ||
Brendan Cully
|
r4263 | Any item in the returned tuple can be None. If filename is None, | ||
fileobj did not contain a patch. Caller must unlink filename when done.''' | ||||
Vadim Gelfer
|
r2866 | |||
# attempt to detect the start of a patch | ||||
# (this heuristic is borrowed from quilt) | ||||
Martin Geisler
|
r7736 | diffre = re.compile(r'^(?:Index:[ \t]|diff[ \t]|RCS file: |' | ||
r'retrieving revision [0-9]+(\.[0-9]+)*$|' | ||||
Benoit Boissinot
|
r10736 | r'---[ \t].*?^\+\+\+[ \t]|' | ||
r'\*\*\*[ \t].*?^---[ \t])', re.MULTILINE|re.DOTALL) | ||||
Vadim Gelfer
|
r2866 | |||
fd, tmpname = tempfile.mkstemp(prefix='hg-patch-') | ||||
tmpfp = os.fdopen(fd, 'w') | ||||
try: | ||||
msg = email.Parser.Parser().parse(fileobj) | ||||
Brendan Cully
|
r4777 | subject = msg['Subject'] | ||
Vadim Gelfer
|
r2866 | user = msg['From'] | ||
Patrick Mezard
|
r9573 | if not subject and not user: | ||
# Not an email, restore parsed headers if any | ||||
subject = '\n'.join(': '.join(h) for h in msg.items()) + '\n' | ||||
Patrick Mezard
|
r5418 | gitsendmail = 'git-send-email' in msg.get('X-Mailer', '') | ||
Vadim Gelfer
|
r2866 | # should try to parse msg['Date'] | ||
date = None | ||||
Brendan Cully
|
r4263 | nodeid = None | ||
Eric Hopper
|
r4443 | branch = None | ||
Brendan Cully
|
r4263 | parents = [] | ||
Vadim Gelfer
|
r2866 | |||
Brendan Cully
|
r4777 | if subject: | ||
if subject.startswith('[PATCH'): | ||||
pend = subject.find(']') | ||||
Brendan Cully
|
r4208 | if pend >= 0: | ||
Matt Mackall
|
r10282 | subject = subject[pend + 1:].lstrip() | ||
Steffen Daode Nurpmeso
|
r15158 | subject = re.sub(r'\n[ \t]+', ' ', subject) | ||
Brendan Cully
|
r4777 | ui.debug('Subject: %s\n' % subject) | ||
Vadim Gelfer
|
r2866 | if user: | ||
ui.debug('From: %s\n' % user) | ||||
diffs_seen = 0 | ||||
ok_types = ('text/plain', 'text/x-diff', 'text/x-patch') | ||||
Bryan O'Sullivan
|
r4900 | message = '' | ||
Vadim Gelfer
|
r2866 | for part in msg.walk(): | ||
content_type = part.get_content_type() | ||||
ui.debug('Content-Type: %s\n' % content_type) | ||||
if content_type not in ok_types: | ||||
continue | ||||
payload = part.get_payload(decode=True) | ||||
m = diffre.search(payload) | ||||
if m: | ||||
Brendan Cully
|
r4220 | hgpatch = False | ||
Mads Kiilerich
|
r12645 | hgpatchheader = False | ||
Brendan Cully
|
r4220 | ignoretext = False | ||
Martin Geisler
|
r9467 | ui.debug('found patch at byte %d\n' % m.start(0)) | ||
Vadim Gelfer
|
r2866 | diffs_seen += 1 | ||
cfp = cStringIO.StringIO() | ||||
for line in payload[:m.start(0)].splitlines(): | ||||
Mads Kiilerich
|
r12728 | if line.startswith('# HG changeset patch') and not hgpatch: | ||
Martin Geisler
|
r9467 | ui.debug('patch generated by hg export\n') | ||
Mads Kiilerich
|
r12728 | hgpatch = True | ||
Mads Kiilerich
|
r12645 | hgpatchheader = True | ||
Vadim Gelfer
|
r2866 | # drop earlier commit message content | ||
cfp.seek(0) | ||||
cfp.truncate() | ||||
Brendan Cully
|
r4778 | subject = None | ||
Mads Kiilerich
|
r12645 | elif hgpatchheader: | ||
Vadim Gelfer
|
r2866 | if line.startswith('# User '): | ||
user = line[7:] | ||||
ui.debug('From: %s\n' % user) | ||||
elif line.startswith("# Date "): | ||||
date = line[7:] | ||||
Eric Hopper
|
r4443 | elif line.startswith("# Branch "): | ||
branch = line[9:] | ||||
Brendan Cully
|
r4263 | elif line.startswith("# Node ID "): | ||
nodeid = line[10:] | ||||
elif line.startswith("# Parent "): | ||||
parents.append(line[10:]) | ||||
Mads Kiilerich
|
r12645 | elif not line.startswith("# "): | ||
hgpatchheader = False | ||||
Patrick Mezard
|
r5418 | elif line == '---' and gitsendmail: | ||
Brendan Cully
|
r4220 | ignoretext = True | ||
Mads Kiilerich
|
r12645 | if not hgpatchheader and not ignoretext: | ||
Vadim Gelfer
|
r2866 | cfp.write(line) | ||
cfp.write('\n') | ||||
message = cfp.getvalue() | ||||
if tmpfp: | ||||
tmpfp.write(payload) | ||||
if not payload.endswith('\n'): | ||||
tmpfp.write('\n') | ||||
elif not diffs_seen and message and content_type == 'text/plain': | ||||
message += '\n' + payload | ||||
except: | ||||
tmpfp.close() | ||||
os.unlink(tmpname) | ||||
raise | ||||
Brendan Cully
|
r4777 | if subject and not message.startswith(subject): | ||
message = '%s\n%s' % (subject, message) | ||||
Vadim Gelfer
|
r2866 | tmpfp.close() | ||
if not diffs_seen: | ||||
os.unlink(tmpname) | ||||
Eric Hopper
|
r4443 | return None, message, user, date, branch, None, None, None | ||
Brendan Cully
|
r4263 | p1 = parents and parents.pop(0) or None | ||
p2 = parents and parents.pop(0) or None | ||||
Eric Hopper
|
r4443 | return tmpname, message, user, date, branch, nodeid, p1, p2 | ||
Brendan Cully
|
r2861 | |||
Benoit Boissinot
|
r8778 | class patchmeta(object): | ||
Patrick Mezard
|
r7148 | """Patched file metadata | ||
'op' is the performed operation within ADD, DELETE, RENAME, MODIFY | ||||
or COPY. 'path' is patched file path. 'oldpath' is set to the | ||||
Patrick Mezard
|
r7149 | origin file when 'op' is either COPY or RENAME, None otherwise. If | ||
file mode is changed, 'mode' is a tuple (islink, isexec) where | ||||
'islink' is True if the file is a symlink and 'isexec' is True if | ||||
the file is executable. Otherwise, 'mode' is None. | ||||
Patrick Mezard
|
r7148 | """ | ||
def __init__(self, path): | ||||
self.path = path | ||||
self.oldpath = None | ||||
self.mode = None | ||||
self.op = 'MODIFY' | ||||
self.binary = False | ||||
Patrick Mezard
|
r7149 | def setmode(self, mode): | ||
islink = mode & 020000 | ||||
isexec = mode & 0100 | ||||
self.mode = (islink, isexec) | ||||
Patrick Mezard
|
r14566 | def copy(self): | ||
other = patchmeta(self.path) | ||||
other.oldpath = self.oldpath | ||||
other.mode = self.mode | ||||
other.op = self.op | ||||
other.binary = self.binary | ||||
return other | ||||
Mads Kiilerich
|
r11018 | def __repr__(self): | ||
return "<patchmeta %s %r>" % (self.op, self.path) | ||||
Patrick Mezard
|
r7152 | def readgitpatch(lr): | ||
Brendan Cully
|
r2861 | """extract git-style metadata about patches from <patchname>""" | ||
Thomas Arendsen Hein
|
r3223 | |||
Brendan Cully
|
r2861 | # Filter patch for git information | ||
gp = None | ||||
gitpatches = [] | ||||
Patrick Mezard
|
r7152 | for line in lr: | ||
Bill Barry
|
r9243 | line = line.rstrip(' \r\n') | ||
Brendan Cully
|
r2861 | if line.startswith('diff --git'): | ||
m = gitre.match(line) | ||||
if m: | ||||
if gp: | ||||
gitpatches.append(gp) | ||||
Nicolas Dumazet
|
r9392 | dst = m.group(2) | ||
Patrick Mezard
|
r7148 | gp = patchmeta(dst) | ||
Brendan Cully
|
r2861 | elif gp: | ||
if line.startswith('--- '): | ||||
gitpatches.append(gp) | ||||
gp = None | ||||
continue | ||||
if line.startswith('rename from '): | ||||
gp.op = 'RENAME' | ||||
Bill Barry
|
r9243 | gp.oldpath = line[12:] | ||
Brendan Cully
|
r2861 | elif line.startswith('rename to '): | ||
Bill Barry
|
r9243 | gp.path = line[10:] | ||
Brendan Cully
|
r2861 | elif line.startswith('copy from '): | ||
gp.op = 'COPY' | ||||
Bill Barry
|
r9243 | gp.oldpath = line[10:] | ||
Brendan Cully
|
r2861 | elif line.startswith('copy to '): | ||
Bill Barry
|
r9243 | gp.path = line[8:] | ||
Brendan Cully
|
r2861 | elif line.startswith('deleted file'): | ||
gp.op = 'DELETE' | ||||
elif line.startswith('new file mode '): | ||||
gp.op = 'ADD' | ||||
Bill Barry
|
r9243 | gp.setmode(int(line[-6:], 8)) | ||
Brendan Cully
|
r2861 | elif line.startswith('new mode '): | ||
Bill Barry
|
r9243 | gp.setmode(int(line[-6:], 8)) | ||
Brendan Cully
|
r3367 | elif line.startswith('GIT binary patch'): | ||
gp.binary = True | ||||
Brendan Cully
|
r2861 | if gp: | ||
gitpatches.append(gp) | ||||
Patrick Mezard
|
r12669 | return gitpatches | ||
Brendan Cully
|
r2861 | |||
Simon Heimberg
|
r8891 | class linereader(object): | ||
Patrick Mezard
|
r8810 | # simple class to allow pushing lines back into the input stream | ||
Patrick Mezard
|
r14418 | def __init__(self, fp): | ||
Patrick Mezard
|
r8810 | self.fp = fp | ||
self.buf = [] | ||||
def push(self, line): | ||||
if line is not None: | ||||
self.buf.append(line) | ||||
def readline(self): | ||||
if self.buf: | ||||
l = self.buf[0] | ||||
del self.buf[0] | ||||
return l | ||||
Patrick Mezard
|
r14418 | return self.fp.readline() | ||
Patrick Mezard
|
r8810 | |||
def __iter__(self): | ||||
Martin Geisler
|
r14494 | while True: | ||
Patrick Mezard
|
r8810 | l = self.readline() | ||
if not l: | ||||
break | ||||
yield l | ||||
Patrick Mezard
|
r14348 | class abstractbackend(object): | ||
def __init__(self, ui): | ||||
Bryan O'Sullivan
|
r4897 | self.ui = ui | ||
Patrick Mezard
|
r14348 | |||
Patrick Mezard
|
r14391 | def getfile(self, fname): | ||
"""Return target file data and flags as a (data, (islink, | ||||
isexec)) tuple. | ||||
Patrick Mezard
|
r14348 | """ | ||
raise NotImplementedError | ||||
Patrick Mezard
|
r14452 | def setfile(self, fname, data, mode, copysource): | ||
Patrick Mezard
|
r14391 | """Write data to target file fname and set its mode. mode is a | ||
(islink, isexec) tuple. If data is None, the file content should | ||||
Patrick Mezard
|
r14452 | be left unchanged. If the file is modified after being copied, | ||
copysource is set to the original file name. | ||||
Patrick Mezard
|
r14367 | """ | ||
Patrick Mezard
|
r14348 | raise NotImplementedError | ||
Patrick Mezard
|
r5652 | |||
Patrick Mezard
|
r14348 | def unlink(self, fname): | ||
"""Unlink target file.""" | ||||
raise NotImplementedError | ||||
def writerej(self, fname, failed, total, lines): | ||||
"""Write rejected lines for fname. total is the number of hunks | ||||
which failed to apply and total the total number of hunks for this | ||||
files. | ||||
""" | ||||
pass | ||||
Patrick Mezard
|
r14351 | def exists(self, fname): | ||
raise NotImplementedError | ||||
Patrick Mezard
|
r14348 | class fsbackend(abstractbackend): | ||
Patrick Mezard
|
r14350 | def __init__(self, ui, basedir): | ||
Patrick Mezard
|
r14348 | super(fsbackend, self).__init__(ui) | ||
Patrick Mezard
|
r14350 | self.opener = scmutil.opener(basedir) | ||
Bryan O'Sullivan
|
r4897 | |||
Patrick Mezard
|
r14366 | def _join(self, f): | ||
return os.path.join(self.opener.base, f) | ||||
Patrick Mezard
|
r14391 | def getfile(self, fname): | ||
path = self._join(fname) | ||||
if os.path.islink(path): | ||||
return (os.readlink(path), (True, False)) | ||||
Patrick Mezard
|
r14531 | isexec = False | ||
Patrick Mezard
|
r7392 | try: | ||
Patrick Mezard
|
r14391 | isexec = os.lstat(path).st_mode & 0100 != 0 | ||
except OSError, e: | ||||
if e.errno != errno.ENOENT: | ||||
raise | ||||
Patrick Mezard
|
r14531 | return (self.opener.read(fname), (False, isexec)) | ||
Patrick Mezard
|
r7392 | |||
Patrick Mezard
|
r14452 | def setfile(self, fname, data, mode, copysource): | ||
Patrick Mezard
|
r14391 | islink, isexec = mode | ||
if data is None: | ||||
util.setflags(self._join(fname), islink, isexec) | ||||
Patrick Mezard
|
r14390 | return | ||
Patrick Mezard
|
r14391 | if islink: | ||
self.opener.symlink(data, fname) | ||||
Patrick Mezard
|
r14367 | else: | ||
Patrick Mezard
|
r14391 | self.opener.write(fname, data) | ||
Patrick Mezard
|
r14367 | if isexec: | ||
util.setflags(self._join(fname), False, True) | ||||
Patrick Mezard
|
r7392 | |||
def unlink(self, fname): | ||||
Patrick Mezard
|
r14368 | try: | ||
util.unlinkpath(self._join(fname)) | ||||
except OSError, inst: | ||||
if inst.errno != errno.ENOENT: | ||||
raise | ||||
Patrick Mezard
|
r7392 | |||
Patrick Mezard
|
r14348 | def writerej(self, fname, failed, total, lines): | ||
fname = fname + ".rej" | ||||
self.ui.warn( | ||||
_("%d out of %d hunks FAILED -- saving rejects to file %s\n") % | ||||
(failed, total, fname)) | ||||
fp = self.opener(fname, 'w') | ||||
fp.writelines(lines) | ||||
fp.close() | ||||
Patrick Mezard
|
r14351 | def exists(self, fname): | ||
Patrick Mezard
|
r14366 | return os.path.lexists(self._join(fname)) | ||
Patrick Mezard
|
r14351 | |||
Patrick Mezard
|
r14370 | class workingbackend(fsbackend): | ||
def __init__(self, ui, repo, similarity): | ||||
super(workingbackend, self).__init__(ui, repo.root) | ||||
self.repo = repo | ||||
self.similarity = similarity | ||||
self.removed = set() | ||||
self.changed = set() | ||||
self.copied = [] | ||||
Patrick Mezard
|
r14453 | def _checkknown(self, fname): | ||
if self.repo.dirstate[fname] == '?' and self.exists(fname): | ||||
raise PatchError(_('cannot patch %s: file is not tracked') % fname) | ||||
Patrick Mezard
|
r14452 | def setfile(self, fname, data, mode, copysource): | ||
Patrick Mezard
|
r14453 | self._checkknown(fname) | ||
Patrick Mezard
|
r14452 | super(workingbackend, self).setfile(fname, data, mode, copysource) | ||
if copysource is not None: | ||||
self.copied.append((copysource, fname)) | ||||
Patrick Mezard
|
r14370 | self.changed.add(fname) | ||
def unlink(self, fname): | ||||
Patrick Mezard
|
r14453 | self._checkknown(fname) | ||
Patrick Mezard
|
r14370 | super(workingbackend, self).unlink(fname) | ||
self.removed.add(fname) | ||||
self.changed.add(fname) | ||||
def close(self): | ||||
wctx = self.repo[None] | ||||
addremoved = set(self.changed) | ||||
for src, dst in self.copied: | ||||
scmutil.dirstatecopy(self.ui, self.repo, wctx, src, dst) | ||||
Patrick Mezard
|
r16112 | if self.removed: | ||
Matt Mackall
|
r14435 | wctx.forget(sorted(self.removed)) | ||
Patrick Mezard
|
r16112 | for f in self.removed: | ||
if f not in self.repo.dirstate: | ||||
# File was deleted and no longer belongs to the | ||||
# dirstate, it was probably marked added then | ||||
# deleted, and should not be considered by | ||||
# addremove(). | ||||
addremoved.discard(f) | ||||
Patrick Mezard
|
r14370 | if addremoved: | ||
cwd = self.repo.getcwd() | ||||
if cwd: | ||||
addremoved = [util.pathto(self.repo.root, cwd, f) | ||||
for f in addremoved] | ||||
scmutil.addremove(self.repo, addremoved, similarity=self.similarity) | ||||
return sorted(self.changed) | ||||
Patrick Mezard
|
r14452 | class filestore(object): | ||
Patrick Mezard
|
r14658 | def __init__(self, maxsize=None): | ||
Patrick Mezard
|
r14452 | self.opener = None | ||
self.files = {} | ||||
self.created = 0 | ||||
Patrick Mezard
|
r14658 | self.maxsize = maxsize | ||
if self.maxsize is None: | ||||
self.maxsize = 4*(2**20) | ||||
self.size = 0 | ||||
self.data = {} | ||||
Patrick Mezard
|
r14452 | |||
Patrick Mezard
|
r14609 | def setfile(self, fname, data, mode, copied=None): | ||
Patrick Mezard
|
r14658 | if self.maxsize < 0 or (len(data) + self.size) <= self.maxsize: | ||
self.data[fname] = (data, mode, copied) | ||||
self.size += len(data) | ||||
else: | ||||
if self.opener is None: | ||||
root = tempfile.mkdtemp(prefix='hg-patch-') | ||||
self.opener = scmutil.opener(root) | ||||
# Avoid filename issues with these simple names | ||||
fn = str(self.created) | ||||
self.opener.write(fn, data) | ||||
self.created += 1 | ||||
self.files[fname] = (fn, mode, copied) | ||||
Patrick Mezard
|
r14452 | |||
def getfile(self, fname): | ||||
Patrick Mezard
|
r14658 | if fname in self.data: | ||
return self.data[fname] | ||||
if not self.opener or fname not in self.files: | ||||
Patrick Mezard
|
r14452 | raise IOError() | ||
Patrick Mezard
|
r14609 | fn, mode, copied = self.files[fname] | ||
return self.opener.read(fn), mode, copied | ||||
Patrick Mezard
|
r14452 | |||
def close(self): | ||||
if self.opener: | ||||
shutil.rmtree(self.opener.base) | ||||
Patrick Mezard
|
r14611 | class repobackend(abstractbackend): | ||
def __init__(self, ui, repo, ctx, store): | ||||
super(repobackend, self).__init__(ui) | ||||
self.repo = repo | ||||
self.ctx = ctx | ||||
self.store = store | ||||
self.changed = set() | ||||
self.removed = set() | ||||
self.copied = {} | ||||
def _checkknown(self, fname): | ||||
if fname not in self.ctx: | ||||
raise PatchError(_('cannot patch %s: file is not tracked') % fname) | ||||
def getfile(self, fname): | ||||
try: | ||||
fctx = self.ctx[fname] | ||||
except error.LookupError: | ||||
raise IOError() | ||||
flags = fctx.flags() | ||||
return fctx.data(), ('l' in flags, 'x' in flags) | ||||
def setfile(self, fname, data, mode, copysource): | ||||
if copysource: | ||||
self._checkknown(copysource) | ||||
if data is None: | ||||
data = self.ctx[fname].data() | ||||
self.store.setfile(fname, data, mode, copysource) | ||||
self.changed.add(fname) | ||||
if copysource: | ||||
self.copied[fname] = copysource | ||||
def unlink(self, fname): | ||||
self._checkknown(fname) | ||||
self.removed.add(fname) | ||||
def exists(self, fname): | ||||
return fname in self.ctx | ||||
def close(self): | ||||
return self.changed | self.removed | ||||
Patrick Mezard
|
r14348 | # @@ -start,len +start,len @@ or @@ -start +start @@ if len is 1 | ||
Patrick Mezard
|
r15510 | unidesc = re.compile('@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@') | ||
contextdesc = re.compile('(?:---|\*\*\*) (\d+)(?:,(\d+))? (?:---|\*\*\*)') | ||||
Patrick Mezard
|
r14348 | eolmodes = ['strict', 'crlf', 'lf', 'auto'] | ||
class patchfile(object): | ||||
Patrick Mezard
|
r14566 | def __init__(self, ui, gp, backend, store, eolmode='strict'): | ||
self.fname = gp.path | ||||
Patrick Mezard
|
r14348 | self.eolmode = eolmode | ||
self.eol = None | ||||
self.backend = backend | ||||
self.ui = ui | ||||
self.lines = [] | ||||
self.exists = False | ||||
Patrick Mezard
|
r14452 | self.missing = True | ||
Patrick Mezard
|
r14566 | self.mode = gp.mode | ||
self.copysource = gp.oldpath | ||||
self.create = gp.op in ('ADD', 'COPY', 'RENAME') | ||||
self.remove = gp.op == 'DELETE' | ||||
Patrick Mezard
|
r14452 | try: | ||
Patrick Mezard
|
r14566 | if self.copysource is None: | ||
data, mode = backend.getfile(self.fname) | ||||
Patrick Mezard
|
r14348 | self.exists = True | ||
Patrick Mezard
|
r14452 | else: | ||
Patrick Mezard
|
r14609 | data, mode = store.getfile(self.copysource)[:2] | ||
Patrick Mezard
|
r14566 | self.exists = backend.exists(self.fname) | ||
Patrick Mezard
|
r14452 | self.missing = False | ||
if data: | ||||
Wagner Bruna
|
r14832 | self.lines = mdiff.splitnewlines(data) | ||
Patrick Mezard
|
r14452 | if self.mode is None: | ||
self.mode = mode | ||||
if self.lines: | ||||
# Normalize line endings | ||||
if self.lines[0].endswith('\r\n'): | ||||
self.eol = '\r\n' | ||||
elif self.lines[0].endswith('\n'): | ||||
self.eol = '\n' | ||||
if eolmode != 'strict': | ||||
nlines = [] | ||||
for l in self.lines: | ||||
if l.endswith('\r\n'): | ||||
l = l[:-2] + '\n' | ||||
nlines.append(l) | ||||
self.lines = nlines | ||||
except IOError: | ||||
Patrick Mezard
|
r14566 | if self.create: | ||
Patrick Mezard
|
r14452 | self.missing = False | ||
if self.mode is None: | ||||
self.mode = (False, False) | ||||
if self.missing: | ||||
self.ui.warn(_("unable to find '%s' for patching\n") % self.fname) | ||||
Patrick Mezard
|
r14348 | |||
self.hash = {} | ||||
self.dirty = 0 | ||||
self.offset = 0 | ||||
self.skew = 0 | ||||
self.rej = [] | ||||
self.fileprinted = False | ||||
self.printfile(False) | ||||
self.hunks = 0 | ||||
Patrick Mezard
|
r14367 | def writelines(self, fname, lines, mode): | ||
Patrick Mezard
|
r14348 | if self.eolmode == 'auto': | ||
eol = self.eol | ||||
elif self.eolmode == 'crlf': | ||||
eol = '\r\n' | ||||
else: | ||||
eol = '\n' | ||||
if self.eolmode != 'strict' and eol and eol != '\n': | ||||
rawlines = [] | ||||
for l in lines: | ||||
if l and l[-1] == '\n': | ||||
l = l[:-1] + eol | ||||
rawlines.append(l) | ||||
lines = rawlines | ||||
Patrick Mezard
|
r14452 | self.backend.setfile(fname, ''.join(lines), mode, self.copysource) | ||
Patrick Mezard
|
r14348 | |||
Bryan O'Sullivan
|
r4897 | def printfile(self, warn): | ||
if self.fileprinted: | ||||
return | ||||
if warn or self.ui.verbose: | ||||
self.fileprinted = True | ||||
Bryan O'Sullivan
|
r4898 | s = _("patching file %s\n") % self.fname | ||
Bryan O'Sullivan
|
r4897 | if warn: | ||
self.ui.warn(s) | ||||
else: | ||||
self.ui.note(s) | ||||
def findlines(self, l, linenum): | ||||
# looks through the hash and finds candidate lines. The | ||||
# result is a list of line numbers sorted based on distance | ||||
# from linenum | ||||
Thomas Arendsen Hein
|
r5143 | |||
Benoit Boissinot
|
r9681 | cand = self.hash.get(l, []) | ||
Bryan O'Sullivan
|
r4897 | if len(cand) > 1: | ||
# resort our list of potentials forward then back. | ||||
Alejandro Santos
|
r9032 | cand.sort(key=lambda x: abs(x - linenum)) | ||
Bryan O'Sullivan
|
r4897 | return cand | ||
def write_rej(self): | ||||
# our rejects are a little different from patch(1). This always | ||||
# creates rejects in the same form as the original patch. A file | ||||
# header is inserted so that you can run the reject through patch again | ||||
# without having to type the filename. | ||||
if not self.rej: | ||||
return | ||||
Patrick Mezard
|
r14349 | base = os.path.basename(self.fname) | ||
lines = ["--- %s\n+++ %s\n" % (base, base)] | ||||
for x in self.rej: | ||||
for l in x.hunk: | ||||
lines.append(l) | ||||
if l[-1] != '\n': | ||||
lines.append("\n\ No newline at end of file\n") | ||||
self.backend.writerej(self.fname, len(self.rej), self.hunks, lines) | ||||
Bryan O'Sullivan
|
r4897 | |||
Nicolas Dumazet
|
r9393 | def apply(self, h): | ||
Bryan O'Sullivan
|
r4897 | if not h.complete(): | ||
Bryan O'Sullivan
|
r4898 | raise PatchError(_("bad hunk #%d %s (%d %d %d %d)") % | ||
Bryan O'Sullivan
|
r4897 | (h.number, h.desc, len(h.a), h.lena, len(h.b), | ||
h.lenb)) | ||||
self.hunks += 1 | ||||
Patrick Mezard
|
r5652 | if self.missing: | ||
self.rej.append(h) | ||||
return -1 | ||||
Patrick Mezard
|
r14451 | if self.exists and self.create: | ||
Patrick Mezard
|
r14452 | if self.copysource: | ||
self.ui.warn(_("cannot create %s: destination already " | ||||
"exists\n" % self.fname)) | ||||
else: | ||||
self.ui.warn(_("file %s already exists\n") % self.fname) | ||||
Bryan O'Sullivan
|
r4897 | self.rej.append(h) | ||
return -1 | ||||
Patrick Mezard
|
r9585 | if isinstance(h, binhunk): | ||
Patrick Mezard
|
r14451 | if self.remove: | ||
Patrick Mezard
|
r14348 | self.backend.unlink(self.fname) | ||
Bryan O'Sullivan
|
r4897 | else: | ||
self.lines[:] = h.new() | ||||
self.offset += len(h.new()) | ||||
Martin Geisler
|
r14217 | self.dirty = True | ||
Bryan O'Sullivan
|
r4897 | return 0 | ||
Patrick Mezard
|
r10127 | horig = h | ||
Patrick Mezard
|
r10128 | if (self.eolmode in ('crlf', 'lf') | ||
or self.eolmode == 'auto' and self.eol): | ||||
# If new eols are going to be normalized, then normalize | ||||
# hunk data before patching. Otherwise, preserve input | ||||
# line-endings. | ||||
Patrick Mezard
|
r10127 | h = h.getnormalized() | ||
Bryan O'Sullivan
|
r4897 | # fast case first, no offsets, no fuzz | ||
Patrick Mezard
|
r16122 | old, oldstart, new, newstart = h.fuzzit(0, False) | ||
oldstart += self.offset | ||||
orig_start = oldstart | ||||
Greg Onufer
|
r10135 | # if there's skew we want to emit the "(offset %d lines)" even | ||
# when the hunk cleanly applies at start + skew, so skip the | ||||
# fast case code | ||||
Patrick Mezard
|
r16122 | if (self.skew == 0 and | ||
diffhelpers.testhunk(old, self.lines, oldstart) == 0): | ||||
Patrick Mezard
|
r14451 | if self.remove: | ||
Patrick Mezard
|
r14348 | self.backend.unlink(self.fname) | ||
Bryan O'Sullivan
|
r4897 | else: | ||
Patrick Mezard
|
r16122 | self.lines[oldstart:oldstart + len(old)] = new | ||
self.offset += len(new) - len(old) | ||||
Martin Geisler
|
r14217 | self.dirty = True | ||
Bryan O'Sullivan
|
r4897 | return 0 | ||
Patrick Mezard
|
r13700 | # ok, we couldn't match the hunk. Lets look for offsets and fuzz it | ||
self.hash = {} | ||||
for x, s in enumerate(self.lines): | ||||
self.hash.setdefault(s, []).append(x) | ||||
Bryan O'Sullivan
|
r4897 | |||
for fuzzlen in xrange(3): | ||||
Matt Mackall
|
r10282 | for toponly in [True, False]: | ||
Patrick Mezard
|
r16122 | old, oldstart, new, newstart = h.fuzzit(fuzzlen, toponly) | ||
Patrick Mezard
|
r16123 | oldstart = oldstart + self.offset + self.skew | ||
oldstart = min(oldstart, len(self.lines)) | ||||
if old: | ||||
cand = self.findlines(old[0][1:], oldstart) | ||||
else: | ||||
# Only adding lines with no or fuzzed context, just | ||||
# take the skew in account | ||||
cand = [oldstart] | ||||
Bryan O'Sullivan
|
r4897 | |||
for l in cand: | ||||
Patrick Mezard
|
r16123 | if not old or diffhelpers.testhunk(old, self.lines, l) == 0: | ||
Patrick Mezard
|
r16121 | self.lines[l : l + len(old)] = new | ||
self.offset += len(new) - len(old) | ||||
Greg Onufer
|
r10135 | self.skew = l - orig_start | ||
Martin Geisler
|
r14217 | self.dirty = True | ||
Wagner Bruna
|
r10518 | offset = l - orig_start - fuzzlen | ||
Bryan O'Sullivan
|
r4897 | if fuzzlen: | ||
Wagner Bruna
|
r10518 | msg = _("Hunk #%d succeeded at %d " | ||
"with fuzz %d " | ||||
"(offset %d lines).\n") | ||||
Bryan O'Sullivan
|
r4897 | self.printfile(True) | ||
Wagner Bruna
|
r10518 | self.ui.warn(msg % | ||
(h.number, l + 1, fuzzlen, offset)) | ||||
Bryan O'Sullivan
|
r4897 | else: | ||
Wagner Bruna
|
r10518 | msg = _("Hunk #%d succeeded at %d " | ||
Wagner Bruna
|
r8090 | "(offset %d lines).\n") | ||
Wagner Bruna
|
r10518 | self.ui.note(msg % (h.number, l + 1, offset)) | ||
Bryan O'Sullivan
|
r4897 | return fuzzlen | ||
self.printfile(True) | ||||
Bryan O'Sullivan
|
r4898 | self.ui.warn(_("Hunk #%d FAILED at %d\n") % (h.number, orig_start)) | ||
Patrick Mezard
|
r10127 | self.rej.append(horig) | ||
Bryan O'Sullivan
|
r4897 | return -1 | ||
Patrick Mezard
|
r13701 | def close(self): | ||
if self.dirty: | ||||
Patrick Mezard
|
r14367 | self.writelines(self.fname, self.lines, self.mode) | ||
Patrick Mezard
|
r13701 | self.write_rej() | ||
return len(self.rej) | ||||
Benoit Boissinot
|
r8778 | class hunk(object): | ||
Patrick Mezard
|
r14451 | def __init__(self, desc, num, lr, context): | ||
Bryan O'Sullivan
|
r4897 | self.number = num | ||
self.desc = desc | ||||
Matt Mackall
|
r10282 | self.hunk = [desc] | ||
Bryan O'Sullivan
|
r4897 | self.a = [] | ||
self.b = [] | ||||
Benoit Boissinot
|
r9682 | self.starta = self.lena = None | ||
self.startb = self.lenb = None | ||||
Patrick Mezard
|
r10127 | if lr is not None: | ||
if context: | ||||
self.read_context_hunk(lr) | ||||
else: | ||||
self.read_unified_hunk(lr) | ||||
Bryan O'Sullivan
|
r4897 | |||
Patrick Mezard
|
r10127 | def getnormalized(self): | ||
"""Return a copy with line endings normalized to LF.""" | ||||
def normalize(lines): | ||||
nlines = [] | ||||
for line in lines: | ||||
if line.endswith('\r\n'): | ||||
line = line[:-2] + '\n' | ||||
nlines.append(line) | ||||
return nlines | ||||
# Dummy object, it is rebuilt manually | ||||
Patrick Mezard
|
r14451 | nh = hunk(self.desc, self.number, None, None) | ||
Patrick Mezard
|
r10127 | nh.number = self.number | ||
nh.desc = self.desc | ||||
Patrick Mezard
|
r10524 | nh.hunk = self.hunk | ||
Patrick Mezard
|
r10127 | nh.a = normalize(self.a) | ||
nh.b = normalize(self.b) | ||||
nh.starta = self.starta | ||||
nh.startb = self.startb | ||||
nh.lena = self.lena | ||||
nh.lenb = self.lenb | ||||
return nh | ||||
Bryan O'Sullivan
|
r4897 | def read_unified_hunk(self, lr): | ||
m = unidesc.match(self.desc) | ||||
if not m: | ||||
Bryan O'Sullivan
|
r4898 | raise PatchError(_("bad hunk #%d") % self.number) | ||
Patrick Mezard
|
r15510 | self.starta, self.lena, self.startb, self.lenb = m.groups() | ||
Martin Geisler
|
r8527 | if self.lena is None: | ||
Bryan O'Sullivan
|
r4897 | self.lena = 1 | ||
else: | ||||
self.lena = int(self.lena) | ||||
Martin Geisler
|
r8527 | if self.lenb is None: | ||
Bryan O'Sullivan
|
r4897 | self.lenb = 1 | ||
else: | ||||
self.lenb = int(self.lenb) | ||||
self.starta = int(self.starta) | ||||
self.startb = int(self.startb) | ||||
Patrick Mezard
|
r7152 | diffhelpers.addlines(lr, self.hunk, self.lena, self.lenb, self.a, self.b) | ||
Bryan O'Sullivan
|
r4897 | # if we hit eof before finishing out the hunk, the last line will | ||
# be zero length. Lets try to fix it up. | ||||
while len(self.hunk[-1]) == 0: | ||||
Dirkjan Ochtman
|
r6948 | del self.hunk[-1] | ||
del self.a[-1] | ||||
del self.b[-1] | ||||
self.lena -= 1 | ||||
self.lenb -= 1 | ||||
Patrick Mezard
|
r13699 | self._fixnewline(lr) | ||
Bryan O'Sullivan
|
r4897 | |||
def read_context_hunk(self, lr): | ||||
self.desc = lr.readline() | ||||
m = contextdesc.match(self.desc) | ||||
if not m: | ||||
Bryan O'Sullivan
|
r4898 | raise PatchError(_("bad hunk #%d") % self.number) | ||
Patrick Mezard
|
r15510 | self.starta, aend = m.groups() | ||
Bryan O'Sullivan
|
r4897 | self.starta = int(self.starta) | ||
Martin Geisler
|
r8527 | if aend is None: | ||
Bryan O'Sullivan
|
r4897 | aend = self.starta | ||
self.lena = int(aend) - self.starta | ||||
if self.starta: | ||||
self.lena += 1 | ||||
for x in xrange(self.lena): | ||||
l = lr.readline() | ||||
if l.startswith('---'): | ||||
Patrick Mezard
|
r12825 | # lines addition, old block is empty | ||
Bryan O'Sullivan
|
r4897 | lr.push(l) | ||
break | ||||
s = l[2:] | ||||
if l.startswith('- ') or l.startswith('! '): | ||||
u = '-' + s | ||||
elif l.startswith(' '): | ||||
u = ' ' + s | ||||
else: | ||||
Bryan O'Sullivan
|
r4898 | raise PatchError(_("bad hunk #%d old text line %d") % | ||
(self.number, x)) | ||||
Bryan O'Sullivan
|
r4897 | self.a.append(u) | ||
self.hunk.append(u) | ||||
l = lr.readline() | ||||
if l.startswith('\ '): | ||||
s = self.a[-1][:-1] | ||||
self.a[-1] = s | ||||
self.hunk[-1] = s | ||||
l = lr.readline() | ||||
m = contextdesc.match(l) | ||||
if not m: | ||||
Bryan O'Sullivan
|
r4898 | raise PatchError(_("bad hunk #%d") % self.number) | ||
Patrick Mezard
|
r15510 | self.startb, bend = m.groups() | ||
Bryan O'Sullivan
|
r4897 | self.startb = int(self.startb) | ||
Martin Geisler
|
r8527 | if bend is None: | ||
Bryan O'Sullivan
|
r4897 | bend = self.startb | ||
self.lenb = int(bend) - self.startb | ||||
if self.startb: | ||||
self.lenb += 1 | ||||
hunki = 1 | ||||
for x in xrange(self.lenb): | ||||
l = lr.readline() | ||||
if l.startswith('\ '): | ||||
Patrick Mezard
|
r12825 | # XXX: the only way to hit this is with an invalid line range. | ||
# The no-eol marker is not counted in the line range, but I | ||||
# guess there are diff(1) out there which behave differently. | ||||
Bryan O'Sullivan
|
r4897 | s = self.b[-1][:-1] | ||
self.b[-1] = s | ||||
Matt Mackall
|
r10282 | self.hunk[hunki - 1] = s | ||
Bryan O'Sullivan
|
r4897 | continue | ||
if not l: | ||||
Patrick Mezard
|
r12825 | # line deletions, new block is empty and we hit EOF | ||
Bryan O'Sullivan
|
r4897 | lr.push(l) | ||
break | ||||
s = l[2:] | ||||
if l.startswith('+ ') or l.startswith('! '): | ||||
u = '+' + s | ||||
elif l.startswith(' '): | ||||
u = ' ' + s | ||||
elif len(self.b) == 0: | ||||
Patrick Mezard
|
r12825 | # line deletions, new block is empty | ||
Bryan O'Sullivan
|
r4897 | lr.push(l) | ||
break | ||||
else: | ||||
Bryan O'Sullivan
|
r4898 | raise PatchError(_("bad hunk #%d old text line %d") % | ||
(self.number, x)) | ||||
Bryan O'Sullivan
|
r4897 | self.b.append(s) | ||
while True: | ||||
if hunki >= len(self.hunk): | ||||
h = "" | ||||
else: | ||||
h = self.hunk[hunki] | ||||
hunki += 1 | ||||
if h == u: | ||||
break | ||||
elif h.startswith('-'): | ||||
continue | ||||
else: | ||||
Matt Mackall
|
r10282 | self.hunk.insert(hunki - 1, u) | ||
Bryan O'Sullivan
|
r4897 | break | ||
if not self.a: | ||||
# this happens when lines were only added to the hunk | ||||
for x in self.hunk: | ||||
if x.startswith('-') or x.startswith(' '): | ||||
self.a.append(x) | ||||
if not self.b: | ||||
# this happens when lines were only deleted from the hunk | ||||
for x in self.hunk: | ||||
if x.startswith('+') or x.startswith(' '): | ||||
self.b.append(x[1:]) | ||||
# @@ -start,len +start,len @@ | ||||
self.desc = "@@ -%d,%d +%d,%d @@\n" % (self.starta, self.lena, | ||||
self.startb, self.lenb) | ||||
self.hunk[0] = self.desc | ||||
Patrick Mezard
|
r13699 | self._fixnewline(lr) | ||
Bryan O'Sullivan
|
r4897 | |||
Patrick Mezard
|
r13699 | def _fixnewline(self, lr): | ||
l = lr.readline() | ||||
if l.startswith('\ '): | ||||
diffhelpers.fix_newline(self.hunk, self.a, self.b) | ||||
else: | ||||
lr.push(l) | ||||
Bryan O'Sullivan
|
r4897 | |||
def complete(self): | ||||
return len(self.a) == self.lena and len(self.b) == self.lenb | ||||
Patrick Mezard
|
r16121 | def _fuzzit(self, old, new, fuzz, toponly): | ||
Bryan O'Sullivan
|
r4897 | # this removes context lines from the top and bottom of list 'l'. It | ||
# checks the hunk to make sure only context lines are removed, and then | ||||
# returns a new shortened list of lines. | ||||
Patrick Mezard
|
r16124 | fuzz = min(fuzz, len(old)) | ||
Bryan O'Sullivan
|
r4897 | if fuzz: | ||
top = 0 | ||||
bot = 0 | ||||
hlen = len(self.hunk) | ||||
Matt Mackall
|
r10282 | for x in xrange(hlen - 1): | ||
Bryan O'Sullivan
|
r4897 | # the hunk starts with the @@ line, so use x+1 | ||
Matt Mackall
|
r10282 | if self.hunk[x + 1][0] == ' ': | ||
Bryan O'Sullivan
|
r4897 | top += 1 | ||
else: | ||||
break | ||||
if not toponly: | ||||
Matt Mackall
|
r10282 | for x in xrange(hlen - 1): | ||
if self.hunk[hlen - bot - 1][0] == ' ': | ||||
Bryan O'Sullivan
|
r4897 | bot += 1 | ||
else: | ||||
break | ||||
Patrick Mezard
|
r16124 | bot = min(fuzz, bot) | ||
top = min(fuzz, top) | ||||
Patrick Mezard
|
r16122 | return old[top:len(old)-bot], new[top:len(new)-bot], top | ||
return old, new, 0 | ||||
Bryan O'Sullivan
|
r4897 | |||
Patrick Mezard
|
r16121 | def fuzzit(self, fuzz, toponly): | ||
Patrick Mezard
|
r16122 | old, new, top = self._fuzzit(self.a, self.b, fuzz, toponly) | ||
oldstart = self.starta + top | ||||
newstart = self.startb + top | ||||
# zero length hunk ranges already have their start decremented | ||||
if self.lena: | ||||
oldstart -= 1 | ||||
if self.lenb: | ||||
newstart -= 1 | ||||
return old, oldstart, new, newstart | ||||
Bryan O'Sullivan
|
r4897 | |||
Thomas Arendsen Hein
|
r14764 | class binhunk(object): | ||
Patrick Mezard
|
r9585 | 'A binary patch file. Only understands literals so far.' | ||
Patrick Mezard
|
r14451 | def __init__(self, lr): | ||
Bryan O'Sullivan
|
r4897 | self.text = None | ||
Patrick Mezard
|
r9585 | self.hunk = ['GIT binary patch\n'] | ||
Patrick Mezard
|
r14384 | self._read(lr) | ||
Bryan O'Sullivan
|
r4897 | |||
def complete(self): | ||||
return self.text is not None | ||||
def new(self): | ||||
return [self.text] | ||||
Patrick Mezard
|
r14384 | def _read(self, lr): | ||
Patrick Mezard
|
r7153 | line = lr.readline() | ||
Bryan O'Sullivan
|
r4897 | self.hunk.append(line) | ||
Brendan Cully
|
r3367 | while line and not line.startswith('literal '): | ||
Patrick Mezard
|
r7153 | line = lr.readline() | ||
Bryan O'Sullivan
|
r4897 | self.hunk.append(line) | ||
Brendan Cully
|
r3367 | if not line: | ||
Bryan O'Sullivan
|
r4898 | raise PatchError(_('could not extract binary patch')) | ||
Bryan O'Sullivan
|
r4897 | size = int(line[8:].rstrip()) | ||
Brendan Cully
|
r3367 | dec = [] | ||
Patrick Mezard
|
r7153 | line = lr.readline() | ||
Bryan O'Sullivan
|
r4897 | self.hunk.append(line) | ||
while len(line) > 1: | ||||
Brendan Cully
|
r3374 | l = line[0] | ||
if l <= 'Z' and l >= 'A': | ||||
l = ord(l) - ord('A') + 1 | ||||
else: | ||||
l = ord(l) - ord('a') + 27 | ||||
Bryan O'Sullivan
|
r4897 | dec.append(base85.b85decode(line[1:-1])[:l]) | ||
Patrick Mezard
|
r7153 | line = lr.readline() | ||
Bryan O'Sullivan
|
r4897 | self.hunk.append(line) | ||
Brendan Cully
|
r3367 | text = zlib.decompress(''.join(dec)) | ||
if len(text) != size: | ||||
Bryan O'Sullivan
|
r4898 | raise PatchError(_('binary patch is %d bytes, not %d') % | ||
Bryan O'Sullivan
|
r4897 | len(text), size) | ||
self.text = text | ||||
Brendan Cully
|
r3367 | |||
Bryan O'Sullivan
|
r4897 | def parsefilename(str): | ||
# --- filename \t|space stuff | ||||
Patrick Mezard
|
r5851 | s = str[4:].rstrip('\r\n') | ||
Bryan O'Sullivan
|
r4897 | i = s.find('\t') | ||
if i < 0: | ||||
i = s.find(' ') | ||||
if i < 0: | ||||
return s | ||||
return s[:i] | ||||
Brendan Cully
|
r2861 | |||
Mads Kiilerich
|
r11022 | def pathstrip(path, strip): | ||
pathlen = len(path) | ||||
i = 0 | ||||
if strip == 0: | ||||
return '', path.rstrip() | ||||
count = strip | ||||
while count > 0: | ||||
i = path.find('/', i) | ||||
if i == -1: | ||||
raise PatchError(_("unable to strip away %d of %d dirs from %s") % | ||||
(count, strip, path)) | ||||
i += 1 | ||||
# consume '//' in the path | ||||
while i < pathlen - 1 and path[i] == '/': | ||||
i += 1 | ||||
count -= 1 | ||||
return path[:i].lstrip(), path[i:].rstrip() | ||||
Patrick Mezard
|
r14566 | def makepatchmeta(backend, afile_orig, bfile_orig, hunk, strip): | ||
Bryan O'Sullivan
|
r4897 | nulla = afile_orig == "/dev/null" | ||
nullb = bfile_orig == "/dev/null" | ||||
Patrick Mezard
|
r14451 | create = nulla and hunk.starta == 0 and hunk.lena == 0 | ||
remove = nullb and hunk.startb == 0 and hunk.lenb == 0 | ||||
Patrick Mezard
|
r6295 | abase, afile = pathstrip(afile_orig, strip) | ||
Patrick Mezard
|
r14351 | gooda = not nulla and backend.exists(afile) | ||
Patrick Mezard
|
r6295 | bbase, bfile = pathstrip(bfile_orig, strip) | ||
Bryan O'Sullivan
|
r4897 | if afile == bfile: | ||
goodb = gooda | ||||
else: | ||||
Patrick Mezard
|
r14351 | goodb = not nullb and backend.exists(bfile) | ||
Patrick Mezard
|
r14451 | missing = not goodb and not gooda and not create | ||
Brendan Cully
|
r9328 | |||
Martin Geisler
|
r11820 | # some diff programs apparently produce patches where the afile is | ||
# not /dev/null, but afile starts with bfile | ||||
Benoit Boissinot
|
r10745 | abasedir = afile[:afile.rfind('/') + 1] | ||
bbasedir = bfile[:bfile.rfind('/') + 1] | ||||
Patrick Mezard
|
r14451 | if (missing and abasedir == bbasedir and afile.startswith(bfile) | ||
and hunk.starta == 0 and hunk.lena == 0): | ||||
create = True | ||||
missing = False | ||||
Brendan Cully
|
r9328 | |||
Patrick Mezard
|
r6295 | # If afile is "a/b/foo" and bfile is "a/b/foo.orig" we assume the | ||
# diff is between a file and its backup. In this case, the original | ||||
# file should be patched (see original mpatch code). | ||||
isbackup = (abase == bbase and bfile.startswith(afile)) | ||||
Patrick Mezard
|
r5652 | fname = None | ||
if not missing: | ||||
if gooda and goodb: | ||||
Patrick Mezard
|
r6295 | fname = isbackup and afile or bfile | ||
Patrick Mezard
|
r5652 | elif gooda: | ||
Bryan O'Sullivan
|
r4897 | fname = afile | ||
Thomas Arendsen Hein
|
r5760 | |||
Patrick Mezard
|
r5652 | if not fname: | ||
if not nullb: | ||||
Patrick Mezard
|
r6295 | fname = isbackup and afile or bfile | ||
Patrick Mezard
|
r5652 | elif not nulla: | ||
Bryan O'Sullivan
|
r4897 | fname = afile | ||
Patrick Mezard
|
r5652 | else: | ||
raise PatchError(_("undefined source and destination files")) | ||||
Thomas Arendsen Hein
|
r5760 | |||
Patrick Mezard
|
r14566 | gp = patchmeta(fname) | ||
if create: | ||||
gp.op = 'ADD' | ||||
elif remove: | ||||
gp.op = 'DELETE' | ||||
return gp | ||||
Bryan O'Sullivan
|
r4897 | |||
Patrick Mezard
|
r7152 | def scangitpatch(lr, firstline): | ||
Dirkjan Ochtman
|
r7186 | """ | ||
Patrick Mezard
|
r7152 | Git patches can emit: | ||
- rename a to b | ||||
- change b | ||||
- copy a to c | ||||
- change c | ||||
Dirkjan Ochtman
|
r7186 | |||
Patrick Mezard
|
r7152 | We cannot apply this sequence as-is, the renamed 'a' could not be | ||
found for it would have been renamed already. And we cannot copy | ||||
from 'b' instead because 'b' would have been changed already. So | ||||
we scan the git patch for copy and rename commands so we can | ||||
perform the copies ahead of time. | ||||
""" | ||||
pos = 0 | ||||
try: | ||||
pos = lr.fp.tell() | ||||
fp = lr.fp | ||||
except IOError: | ||||
fp = cStringIO.StringIO(lr.fp.read()) | ||||
Patrick Mezard
|
r14418 | gitlr = linereader(fp) | ||
Patrick Mezard
|
r7152 | gitlr.push(firstline) | ||
Patrick Mezard
|
r12669 | gitpatches = readgitpatch(gitlr) | ||
Patrick Mezard
|
r7152 | fp.seek(pos) | ||
Patrick Mezard
|
r12669 | return gitpatches | ||
Patrick Mezard
|
r7152 | |||
Idan Kamara
|
r14240 | def iterhunks(fp): | ||
Patrick Mezard
|
r5650 | """Read a patch and yield the following events: | ||
- ("file", afile, bfile, firsthunk): select a new target file. | ||||
- ("hunk", hunk): a new hunk is ready to be applied, follows a | ||||
"file" event. | ||||
- ("git", gitchanges): current diff is in git format, gitchanges | ||||
maps filenames to gitpatch records. Unique event. | ||||
""" | ||||
Bryan O'Sullivan
|
r4897 | afile = "" | ||
bfile = "" | ||||
state = None | ||||
hunknum = 0 | ||||
Patrick Mezard
|
r14017 | emitfile = newfile = False | ||
Patrick Mezard
|
r14388 | gitpatches = None | ||
Brendan Cully
|
r2861 | |||
Bryan O'Sullivan
|
r4897 | # our states | ||
BFILE = 1 | ||||
context = None | ||||
Patrick Mezard
|
r10128 | lr = linereader(fp) | ||
Brendan Cully
|
r2861 | |||
Bryan O'Sullivan
|
r4897 | while True: | ||
x = lr.readline() | ||||
if not x: | ||||
break | ||||
Patrick Mezard
|
r14383 | if state == BFILE and ( | ||
(not context and x[0] == '@') | ||||
or (context is not False and x.startswith('***************')) | ||||
or x.startswith('GIT binary patch')): | ||||
Patrick Mezard
|
r14388 | gp = None | ||
Patrick Mezard
|
r14534 | if (gitpatches and | ||
(gitpatches[-1][0] == afile or gitpatches[-1][1] == bfile)): | ||||
gp = gitpatches.pop()[2] | ||||
Patrick Mezard
|
r14383 | if x.startswith('GIT binary patch'): | ||
Patrick Mezard
|
r14451 | h = binhunk(lr) | ||
Patrick Mezard
|
r14383 | else: | ||
if context is None and x.startswith('***************'): | ||||
context = True | ||||
Patrick Mezard
|
r14451 | h = hunk(x, hunknum + 1, lr, context) | ||
Bryan O'Sullivan
|
r4897 | hunknum += 1 | ||
Patrick Mezard
|
r5650 | if emitfile: | ||
emitfile = False | ||||
Patrick Mezard
|
r14566 | yield 'file', (afile, bfile, h, gp and gp.copy() or None) | ||
Patrick Mezard
|
r13699 | yield 'hunk', h | ||
Bryan O'Sullivan
|
r4897 | elif x.startswith('diff --git'): | ||
m = gitre.match(x) | ||||
Patrick Mezard
|
r14387 | if not m: | ||
continue | ||||
Dan Villiom Podlaski Christiansen
|
r15086 | if not gitpatches: | ||
Patrick Mezard
|
r14387 | # scan whole input for git metadata | ||
Patrick Mezard
|
r14534 | gitpatches = [('a/' + gp.path, 'b/' + gp.path, gp) for gp | ||
Patrick Mezard
|
r14388 | in scangitpatch(lr, x)] | ||
Patrick Mezard
|
r14566 | yield 'git', [g[2].copy() for g in gitpatches | ||
Patrick Mezard
|
r14534 | if g[2].op in ('COPY', 'RENAME')] | ||
Patrick Mezard
|
r14388 | gitpatches.reverse() | ||
Patrick Mezard
|
r14387 | afile = 'a/' + m.group(1) | ||
bfile = 'b/' + m.group(2) | ||||
Patrick Mezard
|
r14534 | while afile != gitpatches[-1][0] and bfile != gitpatches[-1][1]: | ||
gp = gitpatches.pop()[2] | ||||
Patrick Mezard
|
r14566 | yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy()) | ||
Patrick Mezard
|
r14534 | gp = gitpatches[-1][2] | ||
Patrick Mezard
|
r14387 | # copy/rename + modify should modify target, not source | ||
if gp.op in ('COPY', 'DELETE', 'RENAME', 'ADD') or gp.mode: | ||||
afile = bfile | ||||
newfile = True | ||||
Bryan O'Sullivan
|
r4897 | elif x.startswith('---'): | ||
# check for a unified diff | ||||
l2 = lr.readline() | ||||
if not l2.startswith('+++'): | ||||
lr.push(l2) | ||||
continue | ||||
newfile = True | ||||
context = False | ||||
afile = parsefilename(x) | ||||
bfile = parsefilename(l2) | ||||
elif x.startswith('***'): | ||||
# check for a context diff | ||||
l2 = lr.readline() | ||||
if not l2.startswith('---'): | ||||
lr.push(l2) | ||||
continue | ||||
l3 = lr.readline() | ||||
lr.push(l3) | ||||
if not l3.startswith("***************"): | ||||
lr.push(l2) | ||||
continue | ||||
newfile = True | ||||
context = True | ||||
afile = parsefilename(x) | ||||
bfile = parsefilename(l2) | ||||
Benoit Boissinot
|
r3057 | |||
Patrick Mezard
|
r14017 | if newfile: | ||
newfile = False | ||||
Patrick Mezard
|
r5650 | emitfile = True | ||
Bryan O'Sullivan
|
r4897 | state = BFILE | ||
hunknum = 0 | ||||
Patrick Mezard
|
r5650 | |||
Patrick Mezard
|
r14388 | while gitpatches: | ||
Patrick Mezard
|
r14534 | gp = gitpatches.pop()[2] | ||
Patrick Mezard
|
r14566 | yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy()) | ||
Patrick Mezard
|
r14388 | |||
Patrick Mezard
|
r14565 | def applydiff(ui, fp, backend, store, strip=1, eolmode='strict'): | ||
Augie Fackler
|
r10966 | """Reads a patch from fp and tries to apply it. | ||
Patrick Mezard
|
r5650 | |||
Patrick Mezard
|
r14565 | Returns 0 for a clean patch, -1 if any rejects were found and 1 if | ||
there was any fuzz. | ||||
Patrick Mezard
|
r8810 | |||
Martin Geisler
|
r10101 | If 'eolmode' is 'strict', the patch content and patched file are | ||
read in binary mode. Otherwise, line endings are ignored when | ||||
patching then normalized according to 'eolmode'. | ||||
Patrick Mezard
|
r8810 | """ | ||
Patrick Mezard
|
r14565 | return _applydiff(ui, fp, patchfile, backend, store, strip=strip, | ||
Patrick Mezard
|
r12916 | eolmode=eolmode) | ||
Augie Fackler
|
r10966 | |||
Patrick Mezard
|
r14565 | def _applydiff(ui, fp, patcher, backend, store, strip=1, | ||
Patrick Mezard
|
r14452 | eolmode='strict'): | ||
Patrick Mezard
|
r14389 | |||
def pstrip(p): | ||||
return pathstrip(p, strip - 1)[1] | ||||
Patrick Mezard
|
r5650 | rejects = 0 | ||
err = 0 | ||||
current_file = None | ||||
Idan Kamara
|
r14240 | for state, values in iterhunks(fp): | ||
Patrick Mezard
|
r5650 | if state == 'hunk': | ||
if not current_file: | ||||
continue | ||||
Mads Kiilerich
|
r11021 | ret = current_file.apply(values) | ||
Patrick Mezard
|
r14565 | if ret > 0: | ||
err = 1 | ||||
Patrick Mezard
|
r5650 | elif state == 'file': | ||
Patrick Mezard
|
r13701 | if current_file: | ||
rejects += current_file.close() | ||||
Patrick Mezard
|
r14388 | current_file = None | ||
afile, bfile, first_hunk, gp = values | ||||
if gp: | ||||
Patrick Mezard
|
r14389 | path = pstrip(gp.path) | ||
Patrick Mezard
|
r14566 | gp.path = pstrip(gp.path) | ||
Patrick Mezard
|
r14452 | if gp.oldpath: | ||
Patrick Mezard
|
r14566 | gp.oldpath = pstrip(gp.oldpath) | ||
else: | ||||
gp = makepatchmeta(backend, afile, bfile, first_hunk, strip) | ||||
if gp.op == 'RENAME': | ||||
backend.unlink(gp.oldpath) | ||||
Patrick Mezard
|
r14388 | if not first_hunk: | ||
Patrick Mezard
|
r14566 | if gp.op == 'DELETE': | ||
backend.unlink(gp.path) | ||||
continue | ||||
data, mode = None, None | ||||
if gp.op in ('RENAME', 'COPY'): | ||||
Patrick Mezard
|
r14609 | data, mode = store.getfile(gp.oldpath)[:2] | ||
Patrick Mezard
|
r14566 | if gp.mode: | ||
mode = gp.mode | ||||
if gp.op == 'ADD': | ||||
# Added files without content have no hunk and | ||||
# must be created | ||||
data = '' | ||||
if data or mode: | ||||
if (gp.op in ('ADD', 'RENAME', 'COPY') | ||||
and backend.exists(gp.path)): | ||||
raise PatchError(_("cannot create %s: destination " | ||||
"already exists") % gp.path) | ||||
backend.setfile(gp.path, data, mode, gp.oldpath) | ||||
Patrick Mezard
|
r14388 | continue | ||
Patrick Mezard
|
r5650 | try: | ||
Patrick Mezard
|
r14566 | current_file = patcher(ui, gp, backend, store, | ||
eolmode=eolmode) | ||||
Martin Geisler
|
r14218 | except PatchError, inst: | ||
ui.warn(str(inst) + '\n') | ||||
Mads Kiilerich
|
r11021 | current_file = None | ||
Patrick Mezard
|
r5650 | rejects += 1 | ||
continue | ||||
elif state == 'git': | ||||
Mads Kiilerich
|
r11021 | for gp in values: | ||
Patrick Mezard
|
r14452 | path = pstrip(gp.oldpath) | ||
data, mode = backend.getfile(path) | ||||
store.setfile(path, data, mode) | ||||
Bryan O'Sullivan
|
r4897 | else: | ||
Patrick Mezard
|
r5650 | raise util.Abort(_('unsupported parser state: %s') % state) | ||
Patrick Mezard
|
r5649 | |||
Patrick Mezard
|
r13701 | if current_file: | ||
rejects += current_file.close() | ||||
Patrick Mezard
|
r5650 | |||
Bryan O'Sullivan
|
r4897 | if rejects: | ||
return -1 | ||||
return err | ||||
Vadim Gelfer
|
r2874 | |||
Patrick Mezard
|
r14382 | def _externalpatch(ui, repo, patcher, patchname, strip, files, | ||
Patrick Mezard
|
r14381 | similarity): | ||
Patrick Mezard
|
r7151 | """use <patcher> to apply <patchname> to the working directory. | ||
returns whether patch was applied with fuzz factor.""" | ||||
fuzz = False | ||||
Patrick Mezard
|
r12673 | args = [] | ||
Patrick Mezard
|
r14382 | cwd = repo.root | ||
Patrick Mezard
|
r7151 | if cwd: | ||
args.append('-d %s' % util.shellquote(cwd)) | ||||
fp = util.popen('%s %s -p%d < %s' % (patcher, ' '.join(args), strip, | ||||
util.shellquote(patchname))) | ||||
Patrick Mezard
|
r14381 | try: | ||
for line in fp: | ||||
line = line.rstrip() | ||||
ui.note(line + '\n') | ||||
if line.startswith('patching file '): | ||||
pf = util.parsepatchoutput(line) | ||||
printed_file = False | ||||
Patrick Mezard
|
r14564 | files.add(pf) | ||
Patrick Mezard
|
r14381 | elif line.find('with fuzz') >= 0: | ||
fuzz = True | ||||
if not printed_file: | ||||
ui.warn(pf + '\n') | ||||
printed_file = True | ||||
ui.warn(line + '\n') | ||||
elif line.find('saving rejects to file') >= 0: | ||||
ui.warn(line + '\n') | ||||
elif line.find('FAILED') >= 0: | ||||
if not printed_file: | ||||
ui.warn(pf + '\n') | ||||
printed_file = True | ||||
ui.warn(line + '\n') | ||||
finally: | ||||
if files: | ||||
cfiles = list(files) | ||||
cwd = repo.getcwd() | ||||
if cwd: | ||||
cfiles = [util.pathto(repo.root, cwd, f) | ||||
Peter Arrenbrecht
|
r14695 | for f in cfiles] | ||
Patrick Mezard
|
r14381 | scmutil.addremove(repo, cfiles, similarity=similarity) | ||
Patrick Mezard
|
r7151 | code = fp.close() | ||
if code: | ||||
raise PatchError(_("patch command failed: %s") % | ||||
Adrian Buehlmann
|
r14234 | util.explainexit(code)[0]) | ||
Patrick Mezard
|
r7151 | return fuzz | ||
Patrick Mezard
|
r14611 | def patchbackend(ui, backend, patchobj, strip, files=None, eolmode='strict'): | ||
Benoit Boissinot
|
r9683 | if files is None: | ||
Patrick Mezard
|
r14564 | files = set() | ||
Patrick Mezard
|
r8810 | if eolmode is None: | ||
eolmode = ui.config('patch', 'eol', 'strict') | ||||
Martin Geisler
|
r10101 | if eolmode.lower() not in eolmodes: | ||
Martin Geisler
|
r12067 | raise util.Abort(_('unsupported line endings type: %s') % eolmode) | ||
Martin Geisler
|
r10101 | eolmode = eolmode.lower() | ||
Dirkjan Ochtman
|
r8843 | |||
Patrick Mezard
|
r14452 | store = filestore() | ||
Patrick Mezard
|
r7151 | try: | ||
Alejandro Santos
|
r9031 | fp = open(patchobj, 'rb') | ||
Patrick Mezard
|
r7151 | except TypeError: | ||
fp = patchobj | ||||
try: | ||||
Patrick Mezard
|
r14565 | ret = applydiff(ui, fp, backend, store, strip=strip, | ||
Patrick Mezard
|
r14452 | eolmode=eolmode) | ||
Patrick Mezard
|
r7151 | finally: | ||
Patrick Mezard
|
r10203 | if fp != patchobj: | ||
fp.close() | ||||
Patrick Mezard
|
r14564 | files.update(backend.close()) | ||
Patrick Mezard
|
r14452 | store.close() | ||
Patrick Mezard
|
r7151 | if ret < 0: | ||
Patrick Mezard
|
r12674 | raise PatchError(_('patch failed to apply')) | ||
Patrick Mezard
|
r7151 | return ret > 0 | ||
Patrick Mezard
|
r14611 | def internalpatch(ui, repo, patchobj, strip, files=None, eolmode='strict', | ||
similarity=0): | ||||
"""use builtin patch to apply <patchobj> to the working directory. | ||||
returns whether patch was applied with fuzz factor.""" | ||||
backend = workingbackend(ui, repo, similarity) | ||||
return patchbackend(ui, backend, patchobj, strip, files, eolmode) | ||||
def patchrepo(ui, repo, ctx, store, patchobj, strip, files=None, | ||||
eolmode='strict'): | ||||
backend = repobackend(ui, repo, ctx, store) | ||||
return patchbackend(ui, backend, patchobj, strip, files, eolmode) | ||||
def makememctx(repo, parents, text, user, date, branch, files, store, | ||||
editor=None): | ||||
def getfilectx(repo, memctx, path): | ||||
data, (islink, isexec), copied = store.getfile(path) | ||||
return context.memfilectx(path, data, islink=islink, isexec=isexec, | ||||
copied=copied) | ||||
extra = {} | ||||
if branch: | ||||
extra['branch'] = encoding.fromlocal(branch) | ||||
ctx = context.memctx(repo, parents, text, files, getfilectx, user, | ||||
date, extra) | ||||
if editor: | ||||
ctx._text = editor(repo, ctx, []) | ||||
return ctx | ||||
Patrick Mezard
|
r14382 | def patch(ui, repo, patchname, strip=1, files=None, eolmode='strict', | ||
Patrick Mezard
|
r14260 | similarity=0): | ||
Patrick Mezard
|
r8810 | """Apply <patchname> to the working directory. | ||
'eolmode' specifies how end of lines should be handled. It can be: | ||||
- 'strict': inputs are read in binary mode, EOLs are preserved | ||||
- 'crlf': EOLs are ignored when patching and reset to CRLF | ||||
- 'lf': EOLs are ignored when patching and reset to LF | ||||
- None: get it from user settings, default to 'strict' | ||||
'eolmode' is ignored when using an external patcher program. | ||||
Returns whether patch was applied with fuzz factor. | ||||
""" | ||||
Patrick Mezard
|
r7151 | patcher = ui.config('ui', 'patch') | ||
Benoit Boissinot
|
r9683 | if files is None: | ||
Patrick Mezard
|
r14564 | files = set() | ||
Patrick Mezard
|
r7151 | try: | ||
if patcher: | ||||
Patrick Mezard
|
r14381 | return _externalpatch(ui, repo, patcher, patchname, strip, | ||
Patrick Mezard
|
r14382 | files, similarity) | ||
Patrick Mezard
|
r14370 | return internalpatch(ui, repo, patchname, strip, files, eolmode, | ||
Patrick Mezard
|
r14260 | similarity) | ||
Patrick Mezard
|
r7151 | except PatchError, err: | ||
Patrick Mezard
|
r12674 | raise util.Abort(str(err)) | ||
Patrick Mezard
|
r7151 | |||
Patrick Mezard
|
r14351 | def changedfiles(ui, repo, patchpath, strip=1): | ||
backend = fsbackend(ui, repo.root) | ||||
Idan Kamara
|
r14255 | fp = open(patchpath, 'rb') | ||
try: | ||||
changed = set() | ||||
for state, values in iterhunks(fp): | ||||
Patrick Mezard
|
r14389 | if state == 'file': | ||
Patrick Mezard
|
r14388 | afile, bfile, first_hunk, gp = values | ||
if gp: | ||||
Patrick Mezard
|
r14566 | gp.path = pathstrip(gp.path, strip - 1)[1] | ||
if gp.oldpath: | ||||
gp.oldpath = pathstrip(gp.oldpath, strip - 1)[1] | ||||
else: | ||||
gp = makepatchmeta(backend, afile, bfile, first_hunk, strip) | ||||
changed.add(gp.path) | ||||
if gp.op == 'RENAME': | ||||
changed.add(gp.oldpath) | ||||
Patrick Mezard
|
r14389 | elif state not in ('hunk', 'git'): | ||
Idan Kamara
|
r14255 | raise util.Abort(_('unsupported parser state: %s') % state) | ||
return changed | ||||
finally: | ||||
fp.close() | ||||
Bryan O'Sullivan
|
r5033 | def b85diff(to, tn): | ||
Brendan Cully
|
r3367 | '''print base85-encoded binary diff''' | ||
def gitindex(text): | ||||
if not text: | ||||
Martin Geisler
|
r12144 | return hex(nullid) | ||
Brendan Cully
|
r3367 | l = len(text) | ||
Dirkjan Ochtman
|
r6470 | s = util.sha1('blob %d\0' % l) | ||
Brendan Cully
|
r3367 | s.update(text) | ||
return s.hexdigest() | ||||
def fmtline(line): | ||||
l = len(line) | ||||
if l <= 26: | ||||
l = chr(ord('A') + l - 1) | ||||
else: | ||||
l = chr(l - 26 + ord('a') - 1) | ||||
return '%c%s\n' % (l, base85.b85encode(line, True)) | ||||
def chunk(text, csize=52): | ||||
l = len(text) | ||||
i = 0 | ||||
while i < l: | ||||
Matt Mackall
|
r10282 | yield text[i:i + csize] | ||
Brendan Cully
|
r3367 | i += csize | ||
Alexis S. L. Carvalho
|
r4105 | tohash = gitindex(to) | ||
tnhash = gitindex(tn) | ||||
if tohash == tnhash: | ||||
Alexis S. L. Carvalho
|
r4106 | return "" | ||
Brendan Cully
|
r3367 | # TODO: deltas | ||
Alexis S. L. Carvalho
|
r4106 | ret = ['index %s..%s\nGIT binary patch\nliteral %s\n' % | ||
(tohash, tnhash, len(tn))] | ||||
for l in chunk(zlib.compress(tn)): | ||||
ret.append(fmtline(l)) | ||||
ret.append('\n') | ||||
return ''.join(ret) | ||||
Brendan Cully
|
r3367 | |||
Patrick Mezard
|
r10189 | class GitDiffRequired(Exception): | ||
pass | ||||
Dirkjan Ochtman
|
r7198 | |||
Patrick Mezard
|
r15528 | def diffopts(ui, opts=None, untrusted=False, section='diff'): | ||
Benoit Boissinot
|
r10615 | def get(key, name=None, getter=ui.configbool): | ||
return ((opts and opts.get(key)) or | ||||
Patrick Mezard
|
r15528 | getter(section, name or key, None, untrusted=untrusted)) | ||
Benoit Boissinot
|
r10615 | return mdiff.diffopts( | ||
text=opts and opts.get('text'), | ||||
git=get('git'), | ||||
nodates=get('nodates'), | ||||
showfunc=get('show_function', 'showfunc'), | ||||
ignorews=get('ignore_all_space', 'ignorews'), | ||||
ignorewsamount=get('ignore_space_change', 'ignorewsamount'), | ||||
ignoreblanklines=get('ignore_blank_lines', 'ignoreblanklines'), | ||||
context=get('unified', getter=ui.config)) | ||||
Patrick Mezard
|
r10189 | def diff(repo, node1=None, node2=None, match=None, changes=None, opts=None, | ||
Martin Geisler
|
r12167 | losedatafn=None, prefix=''): | ||
Dirkjan Ochtman
|
r7308 | '''yields diff of changes to files between two nodes, or node and | ||
Vadim Gelfer
|
r2874 | working directory. | ||
if node1 is None, use first dirstate parent instead. | ||||
Patrick Mezard
|
r10189 | if node2 is None, compare node1 with working directory. | ||
losedatafn(**kwarg) is a callable run when opts.upgrade=True and | ||||
every time some change cannot be represented with the current | ||||
patch format. Return False to upgrade to git patch format, True to | ||||
accept the loss or raise an exception to abort the diff. It is | ||||
called with the name of current file being diffed as 'fn'. If set | ||||
to None, patches will always be upgraded to git format when | ||||
necessary. | ||||
Martin Geisler
|
r12167 | |||
prefix is a filename prefix that is prepended to all filenames on | ||||
display (used for subrepos). | ||||
Patrick Mezard
|
r10189 | ''' | ||
Vadim Gelfer
|
r2874 | |||
if opts is None: | ||||
opts = mdiff.defaultopts | ||||
Yannick Gingras
|
r9725 | if not node1 and not node2: | ||
Matt Mackall
|
r13878 | node1 = repo.dirstate.p1() | ||
Brendan Cully
|
r2934 | |||
Brendan Cully
|
r9123 | def lrugetfilectx(): | ||
cache = {} | ||||
order = [] | ||||
def getfilectx(f, ctx): | ||||
fctx = ctx.filectx(f, filelog=cache.get(f)) | ||||
if f not in cache: | ||||
if len(cache) > 20: | ||||
del cache[order.pop(0)] | ||||
Benoit Boissinot
|
r9684 | cache[f] = fctx.filelog() | ||
Brendan Cully
|
r9123 | else: | ||
order.remove(f) | ||||
order.append(f) | ||||
return fctx | ||||
return getfilectx | ||||
getfilectx = lrugetfilectx() | ||||
Brendan Cully
|
r2934 | |||
Matt Mackall
|
r6747 | ctx1 = repo[node1] | ||
Matt Mackall
|
r7090 | ctx2 = repo[node2] | ||
Vadim Gelfer
|
r2874 | |||
if not changes: | ||||
Matt Mackall
|
r7090 | changes = repo.status(ctx1, ctx2, match=match) | ||
Matt Mackall
|
r6760 | modified, added, removed = changes[:3] | ||
Vadim Gelfer
|
r2874 | |||
if not modified and not added and not removed: | ||||
Patrick Mezard
|
r10189 | return [] | ||
revs = None | ||||
if not repo.ui.quiet: | ||||
hexfunc = repo.ui.debugflag and hex or short | ||||
revs = [hexfunc(node) for node in [node1, node2] if node] | ||||
copy = {} | ||||
if opts.git or opts.upgrade: | ||||
Matt Mackall
|
r15774 | copy = copies.pathcopies(ctx1, ctx2) | ||
Patrick Mezard
|
r10189 | |||
difffn = lambda opts, losedata: trydiff(repo, revs, ctx1, ctx2, | ||||
Martin Geisler
|
r12167 | modified, added, removed, copy, getfilectx, opts, losedata, prefix) | ||
Patrick Mezard
|
r10189 | if opts.upgrade and not opts.git: | ||
try: | ||||
def losedata(fn): | ||||
if not losedatafn or not losedatafn(fn=fn): | ||||
raise GitDiffRequired() | ||||
# Buffer the whole output until we are sure it can be generated | ||||
return list(difffn(opts.copy(git=False), losedata)) | ||||
except GitDiffRequired: | ||||
return difffn(opts.copy(git=True), None) | ||||
else: | ||||
return difffn(opts, None) | ||||
Brodie Rao
|
r10818 | def difflabel(func, *args, **kw): | ||
'''yields 2-tuples of (output, label) based on the output of func()''' | ||||
Kirill Elagin
|
r15201 | headprefixes = [('diff', 'diff.diffline'), | ||
('copy', 'diff.extended'), | ||||
('rename', 'diff.extended'), | ||||
('old', 'diff.extended'), | ||||
('new', 'diff.extended'), | ||||
('deleted', 'diff.extended'), | ||||
('---', 'diff.file_a'), | ||||
('+++', 'diff.file_b')] | ||||
textprefixes = [('@', 'diff.hunk'), | ||||
('-', 'diff.deleted'), | ||||
('+', 'diff.inserted')] | ||||
head = False | ||||
Brodie Rao
|
r10818 | for chunk in func(*args, **kw): | ||
lines = chunk.split('\n') | ||||
for i, line in enumerate(lines): | ||||
if i != 0: | ||||
yield ('\n', '') | ||||
Kirill Elagin
|
r15201 | if head: | ||
if line.startswith('@'): | ||||
head = False | ||||
else: | ||||
Benoit Allard
|
r15582 | if line and not line[0] in ' +-@\\': | ||
Kirill Elagin
|
r15201 | head = True | ||
Brodie Rao
|
r10818 | stripline = line | ||
Kirill Elagin
|
r15201 | if not head and line and line[0] in '+-': | ||
Brodie Rao
|
r10818 | # highlight trailing whitespace, but only in changed lines | ||
stripline = line.rstrip() | ||||
Kirill Elagin
|
r15201 | prefixes = textprefixes | ||
if head: | ||||
prefixes = headprefixes | ||||
Brodie Rao
|
r10818 | for prefix, label in prefixes: | ||
if stripline.startswith(prefix): | ||||
yield (stripline, label) | ||||
break | ||||
else: | ||||
yield (line, '') | ||||
if line != stripline: | ||||
yield (line[len(stripline):], 'diff.trailingwhitespace') | ||||
def diffui(*args, **kw): | ||||
'''like diff(), but yields 2-tuples of (output, label) for ui.write()''' | ||||
return difflabel(diff, *args, **kw) | ||||
Patrick Mezard
|
r10189 | def _addmodehdr(header, omode, nmode): | ||
if omode != nmode: | ||||
header.append('old mode %s\n' % omode) | ||||
header.append('new mode %s\n' % nmode) | ||||
def trydiff(repo, revs, ctx1, ctx2, modified, added, removed, | ||||
Martin Geisler
|
r12167 | copy, getfilectx, opts, losedatafn, prefix): | ||
def join(f): | ||||
return os.path.join(prefix, f) | ||||
Vadim Gelfer
|
r2874 | |||
Matt Mackall
|
r7090 | date1 = util.datestr(ctx1.date()) | ||
man1 = ctx1.manifest() | ||||
Benoit Boissinot
|
r3967 | |||
Patrick Mezard
|
r10189 | gone = set() | ||
gitmode = {'l': '120000', 'x': '100755', '': '100644'} | ||||
Vadim Gelfer
|
r2874 | |||
Wagner Bruna
|
r10466 | copyto = dict([(v, k) for k, v in copy.items()]) | ||
Brendan Cully
|
r2907 | if opts.git: | ||
Patrick Mezard
|
r10189 | revs = None | ||
Matt Mackall
|
r3996 | |||
Matt Mackall
|
r8209 | for f in sorted(modified + added + removed): | ||
Vadim Gelfer
|
r2874 | to = None | ||
tn = None | ||||
Brendan Cully
|
r2907 | dodiff = True | ||
Brendan Cully
|
r3329 | header = [] | ||
Benoit Boissinot
|
r3967 | if f in man1: | ||
to = getfilectx(f, ctx1).data() | ||||
Vadim Gelfer
|
r2874 | if f not in removed: | ||
Benoit Boissinot
|
r3967 | tn = getfilectx(f, ctx2).data() | ||
Dustin Sallings
|
r5482 | a, b = f, f | ||
Patrick Mezard
|
r10189 | if opts.git or losedatafn: | ||
Brendan Cully
|
r2907 | if f in added: | ||
Matt Mackall
|
r6743 | mode = gitmode[ctx2.flags(f)] | ||
Wagner Bruna
|
r10466 | if f in copy or f in copyto: | ||
Patrick Mezard
|
r10189 | if opts.git: | ||
Wagner Bruna
|
r10466 | if f in copy: | ||
a = copy[f] | ||||
else: | ||||
a = copyto[f] | ||||
Patrick Mezard
|
r10189 | omode = gitmode[man1.flags(a)] | ||
_addmodehdr(header, omode, mode) | ||||
if a in removed and a not in gone: | ||||
op = 'rename' | ||||
gone.add(a) | ||||
else: | ||||
op = 'copy' | ||||
Martin Geisler
|
r12167 | header.append('%s from %s\n' % (op, join(a))) | ||
header.append('%s to %s\n' % (op, join(f))) | ||||
Patrick Mezard
|
r10189 | to = getfilectx(a, ctx1).data() | ||
Alexis S. L. Carvalho
|
r3702 | else: | ||
Patrick Mezard
|
r10189 | losedatafn(f) | ||
Brendan Cully
|
r2907 | else: | ||
Patrick Mezard
|
r10189 | if opts.git: | ||
header.append('new file mode %s\n' % mode) | ||||
elif ctx2.flags(f): | ||||
losedatafn(f) | ||||
Patrick Mezard
|
r12576 | # In theory, if tn was copied or renamed we should check | ||
# if the source is binary too but the copy record already | ||||
# forces git mode. | ||||
Alexis S. L. Carvalho
|
r4092 | if util.binary(tn): | ||
Patrick Mezard
|
r10189 | if opts.git: | ||
dodiff = 'binary' | ||||
else: | ||||
losedatafn(f) | ||||
if not opts.git and not tn: | ||||
# regular diffs cannot represent new empty file | ||||
losedatafn(f) | ||||
Brendan Cully
|
r2907 | elif f in removed: | ||
Patrick Mezard
|
r10189 | if opts.git: | ||
# have we already reported a copy above? | ||||
Patrick Mezard
|
r10467 | if ((f in copy and copy[f] in added | ||
and copyto[copy[f]] == f) or | ||||
(f in copyto and copyto[f] in added | ||||
and copy[copyto[f]] == f)): | ||||
Patrick Mezard
|
r10189 | dodiff = False | ||
else: | ||||
header.append('deleted file mode %s\n' % | ||||
gitmode[man1.flags(f)]) | ||||
Patrick Mezard
|
r12575 | elif not to or util.binary(to): | ||
Patrick Mezard
|
r10189 | # regular diffs cannot represent empty file deletion | ||
losedatafn(f) | ||||
Brendan Cully
|
r2907 | else: | ||
Patrick Mezard
|
r10189 | oflag = man1.flags(f) | ||
nflag = ctx2.flags(f) | ||||
binary = util.binary(to) or util.binary(tn) | ||||
if opts.git: | ||||
_addmodehdr(header, gitmode[oflag], gitmode[nflag]) | ||||
if binary: | ||||
dodiff = 'binary' | ||||
elif binary or nflag != oflag: | ||||
losedatafn(f) | ||||
if opts.git: | ||||
Martin Geisler
|
r12167 | header.insert(0, mdiff.diffline(revs, join(a), join(b), opts)) | ||
Patrick Mezard
|
r10189 | |||
Alexis S. L. Carvalho
|
r4106 | if dodiff: | ||
if dodiff == 'binary': | ||||
Bryan O'Sullivan
|
r5033 | text = b85diff(to, tn) | ||
Alexis S. L. Carvalho
|
r4106 | else: | ||
Thomas Arendsen Hein
|
r4108 | text = mdiff.unidiff(to, date1, | ||
# ctx2 date may be dynamic | ||||
tn, util.datestr(ctx2.date()), | ||||
Martin Geisler
|
r12167 | join(a), join(b), revs, opts=opts) | ||
Dirkjan Ochtman
|
r7308 | if header and (text or len(header) > 1): | ||
yield ''.join(header) | ||||
if text: | ||||
yield text | ||||
Vadim Gelfer
|
r2874 | |||
Matt Mackall
|
r14401 | def diffstatsum(stats): | ||
Steven Brown
|
r14437 | maxfile, maxtotal, addtotal, removetotal, binary = 0, 0, 0, 0, False | ||
Matt Mackall
|
r14401 | for f, a, r, b in stats: | ||
maxfile = max(maxfile, encoding.colwidth(f)) | ||||
Steven Brown
|
r14437 | maxtotal = max(maxtotal, a + r) | ||
Matt Mackall
|
r14401 | addtotal += a | ||
removetotal += r | ||||
binary = binary or b | ||||
Steven Brown
|
r14437 | return maxfile, maxtotal, addtotal, removetotal, binary | ||
Matt Mackall
|
r14401 | |||
Alexander Solovyov
|
r7547 | def diffstatdata(lines): | ||
Gastón Kleiman
|
r13395 | diffre = re.compile('^diff .*-r [a-z0-9]+\s(.*)$') | ||
Matt Mackall
|
r14400 | results = [] | ||
Patrick Mezard
|
r15363 | filename, adds, removes, isbinary = None, 0, 0, False | ||
Matt Mackall
|
r14400 | |||
def addresult(): | ||||
if filename: | ||||
results.append((filename, adds, removes, isbinary)) | ||||
Alexander Solovyov
|
r7547 | for line in lines: | ||
if line.startswith('diff'): | ||||
Matt Mackall
|
r14400 | addresult() | ||
Alexander Solovyov
|
r7547 | # set numbers to 0 anyway when starting new file | ||
Patrick Mezard
|
r15363 | adds, removes, isbinary = 0, 0, False | ||
Alexander Solovyov
|
r7547 | if line.startswith('diff --git'): | ||
filename = gitre.search(line).group(1) | ||||
Gastón Kleiman
|
r13395 | elif line.startswith('diff -r'): | ||
timeless
|
r8761 | # format: "diff -r ... -r ... filename" | ||
Gastón Kleiman
|
r13395 | filename = diffre.search(line).group(1) | ||
Jesus Espino Garcia
|
r15971 | elif line.startswith('+') and not line.startswith('+++ '): | ||
Alexander Solovyov
|
r7547 | adds += 1 | ||
Jesus Espino Garcia
|
r15971 | elif line.startswith('-') and not line.startswith('--- '): | ||
Alexander Solovyov
|
r7547 | removes += 1 | ||
Patrick Mezard
|
r15363 | elif (line.startswith('GIT binary patch') or | ||
line.startswith('Binary file')): | ||||
isbinary = True | ||||
Matt Mackall
|
r14400 | addresult() | ||
return results | ||||
Alexander Solovyov
|
r7547 | |||
Brodie Rao
|
r9642 | def diffstat(lines, width=80, git=False): | ||
Alexander Solovyov
|
r7547 | output = [] | ||
Matt Mackall
|
r14402 | stats = diffstatdata(lines) | ||
Steven Brown
|
r14437 | maxname, maxtotal, totaladds, totalremoves, hasbinary = diffstatsum(stats) | ||
Alexander Solovyov
|
r7547 | |||
countwidth = len(str(maxtotal)) | ||||
Brodie Rao
|
r9642 | if hasbinary and countwidth < 3: | ||
countwidth = 3 | ||||
Brodie Rao
|
r9330 | graphwidth = width - countwidth - maxname - 6 | ||
Alexander Solovyov
|
r7547 | if graphwidth < 10: | ||
graphwidth = 10 | ||||
Brodie Rao
|
r9330 | def scale(i): | ||
if maxtotal <= graphwidth: | ||||
return i | ||||
# If diffstat runs out of room it doesn't print anything, | ||||
# which isn't very useful, so always print at least one + or - | ||||
# if there were at least some changes. | ||||
return max(i * graphwidth // maxtotal, int(bool(i))) | ||||
Alexander Solovyov
|
r7547 | |||
Matt Mackall
|
r14402 | for filename, adds, removes, isbinary in stats: | ||
Patrick Mezard
|
r15363 | if isbinary: | ||
Brodie Rao
|
r9642 | count = 'Bin' | ||
else: | ||||
count = adds + removes | ||||
Brodie Rao
|
r9330 | pluses = '+' * scale(adds) | ||
minuses = '-' * scale(removes) | ||||
FUJIWARA Katsunori
|
r11611 | output.append(' %s%s | %*s %s%s\n' % | ||
Matt Mackall
|
r14402 | (filename, ' ' * (maxname - encoding.colwidth(filename)), | ||
countwidth, count, pluses, minuses)) | ||||
Alexander Solovyov
|
r7547 | |||
if stats: | ||||
Martin Geisler
|
r9331 | output.append(_(' %d files changed, %d insertions(+), %d deletions(-)\n') | ||
Matt Mackall
|
r7860 | % (len(stats), totaladds, totalremoves)) | ||
Alexander Solovyov
|
r7547 | |||
return ''.join(output) | ||||
Brodie Rao
|
r10818 | |||
def diffstatui(*args, **kw): | ||||
'''like diffstat(), but yields 2-tuples of (output, label) for | ||||
ui.write() | ||||
''' | ||||
for line in diffstat(*args, **kw).splitlines(): | ||||
if line and line[-1] in '+-': | ||||
name, graph = line.rsplit(' ', 1) | ||||
yield (name + ' ', '') | ||||
m = re.search(r'\++', graph) | ||||
if m: | ||||
yield (m.group(0), 'diffstat.inserted') | ||||
m = re.search(r'-+', graph) | ||||
if m: | ||||
yield (m.group(0), 'diffstat.deleted') | ||||
else: | ||||
yield (line, '') | ||||
yield ('\n', '') | ||||