##// END OF EJS Templates
diffutil: extract diff options code into a dedicated util-module...
Boris Feld -
r38581:c88d2c9b default
parent child Browse files
Show More
@@ -1,2951 +1,2866
1 1 # patch.py - patch file parsing routines
2 2 #
3 3 # Copyright 2006 Brendan Cully <brendan@kublai.com>
4 4 # Copyright 2007 Chris Mason <chris.mason@oracle.com>
5 5 #
6 6 # This software may be used and distributed according to the terms of the
7 7 # GNU General Public License version 2 or any later version.
8 8
9 9 from __future__ import absolute_import, print_function
10 10
11 11 import collections
12 12 import contextlib
13 13 import copy
14 14 import email
15 15 import errno
16 16 import hashlib
17 17 import os
18 18 import posixpath
19 19 import re
20 20 import shutil
21 21 import zlib
22 22
23 23 from .i18n import _
24 24 from .node import (
25 25 hex,
26 26 short,
27 27 )
28 28 from . import (
29 29 copies,
30 30 diffhelper,
31 31 encoding,
32 32 error,
33 33 mail,
34 34 mdiff,
35 35 pathutil,
36 36 pycompat,
37 37 scmutil,
38 38 similar,
39 39 util,
40 40 vfs as vfsmod,
41 41 )
42 42 from .utils import (
43 43 dateutil,
44 diffutil,
44 45 procutil,
45 46 stringutil,
46 47 )
47 48
# Factory for in-memory file-like buffers (util's StringIO/BytesIO wrapper).
stringio = util.stringio

# Matches the "diff --git a/<old> b/<new>" header line of a git-style diff.
gitre = re.compile(br'diff --git a/(.*) b/(.*)')
# Splits a line into alternating runs of tabs and non-tabs.
tabsplitter = re.compile(br'(\t+|[^\t]+)')
# Splits a line into tabs, spaces, word runs (incl. 8-bit bytes), or single
# punctuation bytes -- used for word-level diff highlighting.
wordsplitter = re.compile(br'(\t+| +|[a-zA-Z0-9_\x80-\xff]+|'
                          b'[^ \ta-zA-Z0-9_\x80-\xff])')

# Re-exported so callers can catch patch errors without importing 'error'.
PatchError = error.PatchError
56 57
57 58 # public functions
58 59
def split(stream):
    '''return an iterator of individual patches from a stream'''
    def isheader(line, inheader):
        # Heuristic test: does this line look like an RFC-2822-style
        # "Key: value" header (or a continuation of one)?
        if inheader and line.startswith((' ', '\t')):
            # continuation
            return True
        if line.startswith((' ', '-', '+')):
            # diff line - don't check for header pattern in there
            return False
        l = line.split(': ', 1)
        return len(l) == 2 and ' ' not in l[0]

    def chunk(lines):
        # Wrap accumulated lines in a file-like object.
        return stringio(''.join(lines))

    def hgsplit(stream, cur):
        # Split on "# HG changeset patch" markers (hg export format).
        inheader = True

        for line in stream:
            if not line.strip():
                inheader = False
            if not inheader and line.startswith('# HG changeset patch'):
                yield chunk(cur)
                cur = []
                inheader = True

            cur.append(line)

        if cur:
            yield chunk(cur)

    def mboxsplit(stream, cur):
        # Split an mbox on "From " separators, recursing into each message
        # (minus its leading separator line).
        for line in stream:
            if line.startswith('From '):
                for c in split(chunk(cur[1:])):
                    yield c
                cur = []

            cur.append(line)

        if cur:
            for c in split(chunk(cur[1:])):
                yield c

    def mimesplit(stream, cur):
        # Let the email parser walk MIME parts; yield text-ish parts only.
        def msgfp(m):
            # Serialize a message part back into a file-like object.
            fp = stringio()
            g = email.Generator.Generator(fp, mangle_from_=False)
            g.flatten(m)
            fp.seek(0)
            return fp

        for line in stream:
            cur.append(line)
        c = chunk(cur)

        m = mail.parse(c)
        if not m.is_multipart():
            yield msgfp(m)
        else:
            ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
            for part in m.walk():
                ct = part.get_content_type()
                if ct not in ok_types:
                    continue
                yield msgfp(part)

    def headersplit(stream, cur):
        # Split whenever a new header block starts after non-header content.
        inheader = False

        for line in stream:
            if not inheader and isheader(line, inheader):
                yield chunk(cur)
                cur = []
                inheader = True
            if inheader and not isheader(line, inheader):
                inheader = False

            cur.append(line)

        if cur:
            yield chunk(cur)

    def remainder(cur):
        # No recognizable structure: the whole input is one patch.
        yield chunk(cur)

    class fiter(object):
        # Adapt objects that only have readline() (e.g. http responses)
        # to the iterator protocol.
        def __init__(self, fp):
            self.fp = fp

        def __iter__(self):
            return self

        def next(self):
            l = self.fp.readline()
            if not l:
                raise StopIteration
            return l

        __next__ = next

    inheader = False
    cur = []

    mimeheaders = ['content-type']

    if not util.safehasattr(stream, 'next'):
        # http responses, for example, have readline but not next
        stream = fiter(stream)

    # Sniff the first lines to pick a splitting strategy.
    for line in stream:
        cur.append(line)
        if line.startswith('# HG changeset patch'):
            return hgsplit(stream, cur)
        elif line.startswith('From '):
            return mboxsplit(stream, cur)
        elif isheader(line, inheader):
            inheader = True
            if line.split(':', 1)[0].lower() in mimeheaders:
                # let email parser handle this
                return mimesplit(stream, cur)
        elif line.startswith('--- ') and inheader:
            # No evil headers seen by diff start, split by hand
            return headersplit(stream, cur)
        # Not enough info, keep reading

    # if we are here, we have a very plain patch
    return remainder(cur)
187 188
## Some facility for extensible patch parsing:
# list of pairs ("header to match", "data key")
# _extract() consults this when it sees a "# <Header> <value>" line in an
# hg patch header and stores the value under the corresponding data key.
patchheadermap = [('Date', 'date'),
                  ('Branch', 'branch'),
                  ('Node ID', 'nodeid'),
                  ]
194 195
@contextlib.contextmanager
def extract(ui, fileobj):
    '''extract patch from data read from fileobj.

    patch can be a normal patch or contained in an email message.

    return a dictionary. Standard keys are:
      - filename,
      - message,
      - user,
      - date,
      - branch,
      - node,
      - p1,
      - p2.
    Any item can be missing from the dictionary. If filename is missing,
    fileobj did not contain a patch. Caller must unlink filename when done.'''

    # The diff payload is written to a temp file; the context manager
    # guarantees it is closed and removed even if the caller raises.
    fd, tmpname = pycompat.mkstemp(prefix='hg-patch-')
    tmpfp = os.fdopen(fd, r'wb')
    try:
        yield _extract(ui, fileobj, tmpname, tmpfp)
    finally:
        tmpfp.close()
        os.unlink(tmpname)
220 221
def _extract(ui, fileobj, tmpname, tmpfp):
    """Parse fileobj (a plain patch or an email containing one).

    The raw diff payload is written to tmpfp; metadata (user, message,
    parents, extensible headers) is returned as a dict, with 'filename'
    set to tmpname when at least one diff was found.
    """

    # attempt to detect the start of a patch
    # (this heuristic is borrowed from quilt)
    diffre = re.compile(br'^(?:Index:[ \t]|diff[ \t]-|RCS file: |'
                        br'retrieving revision [0-9]+(\.[0-9]+)*$|'
                        br'---[ \t].*?^\+\+\+[ \t]|'
                        br'\*\*\*[ \t].*?^---[ \t])',
                        re.MULTILINE | re.DOTALL)

    data = {}

    msg = mail.parse(fileobj)

    subject = msg[r'Subject'] and mail.headdecode(msg[r'Subject'])
    data['user'] = msg[r'From'] and mail.headdecode(msg[r'From'])
    if not subject and not data['user']:
        # Not an email, restore parsed headers if any
        subject = '\n'.join(': '.join(map(encoding.strtolocal, h))
                            for h in msg.items()) + '\n'

    # should try to parse msg['Date']
    parents = []

    if subject:
        # Strip a leading "[PATCH ...]" tag and unfold continuation lines.
        if subject.startswith('[PATCH'):
            pend = subject.find(']')
            if pend >= 0:
                subject = subject[pend + 1:].lstrip()
        subject = re.sub(br'\n[ \t]+', ' ', subject)
        ui.debug('Subject: %s\n' % subject)
    if data['user']:
        ui.debug('From: %s\n' % data['user'])
    diffs_seen = 0
    ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
    message = ''
    for part in msg.walk():
        content_type = pycompat.bytestr(part.get_content_type())
        ui.debug('Content-Type: %s\n' % content_type)
        if content_type not in ok_types:
            continue
        payload = part.get_payload(decode=True)
        m = diffre.search(payload)
        if m:
            # State for parsing an hg export header embedded in the text
            # preceding the diff.
            hgpatch = False
            hgpatchheader = False
            ignoretext = False

            ui.debug('found patch at byte %d\n' % m.start(0))
            diffs_seen += 1
            cfp = stringio()
            for line in payload[:m.start(0)].splitlines():
                if line.startswith('# HG changeset patch') and not hgpatch:
                    ui.debug('patch generated by hg export\n')
                    hgpatch = True
                    hgpatchheader = True
                    # drop earlier commit message content
                    cfp.seek(0)
                    cfp.truncate()
                    subject = None
                elif hgpatchheader:
                    if line.startswith('# User '):
                        data['user'] = line[7:]
                        ui.debug('From: %s\n' % data['user'])
                    elif line.startswith("# Parent "):
                        parents.append(line[9:].lstrip())
                    elif line.startswith("# "):
                        # Extensible headers; see patchheadermap.
                        for header, key in patchheadermap:
                            prefix = '# %s ' % header
                            if line.startswith(prefix):
                                data[key] = line[len(prefix):]
                    else:
                        hgpatchheader = False
                elif line == '---':
                    # "---" separates the message from a diffstat; ignore
                    # everything after it.
                    ignoretext = True
                if not hgpatchheader and not ignoretext:
                    cfp.write(line)
                    cfp.write('\n')
            message = cfp.getvalue()
            if tmpfp:
                tmpfp.write(payload)
                if not payload.endswith('\n'):
                    tmpfp.write('\n')
        elif not diffs_seen and message and content_type == 'text/plain':
            message += '\n' + payload

    if subject and not message.startswith(subject):
        message = '%s\n%s' % (subject, message)
    data['message'] = message
    tmpfp.close()
    if parents:
        data['p1'] = parents.pop(0)
    if parents:
        data['p2'] = parents.pop(0)

    if diffs_seen:
        data['filename'] = tmpname

    return data
320 321
class patchmeta(object):
    """Patched file metadata

    'op' is the performed operation within ADD, DELETE, RENAME, MODIFY
    or COPY.  'path' is the patched file path, while 'oldpath' names the
    origin file when 'op' is COPY or RENAME (None otherwise).  When the
    file mode changes, 'mode' is an (islink, isexec) pair; otherwise it
    stays None.
    """
    def __init__(self, path):
        self.path = path
        self.oldpath = None
        self.mode = None
        self.op = 'MODIFY'
        self.binary = False

    def setmode(self, mode):
        # Extract the symlink and owner-exec bits from a POSIX mode word.
        self.mode = (mode & 0o20000, mode & 0o100)

    def copy(self):
        """Return an independent duplicate of this metadata object."""
        dup = patchmeta(self.path)
        dup.oldpath = self.oldpath
        dup.mode = self.mode
        dup.op = self.op
        dup.binary = self.binary
        return dup

    def _ispatchinga(self, afile):
        # The "a/" side of an added file is the null device.
        if afile == '/dev/null':
            return self.op == 'ADD'
        source = self.oldpath or self.path
        return afile == 'a/' + source

    def _ispatchingb(self, bfile):
        # The "b/" side of a deleted file is the null device.
        if bfile == '/dev/null':
            return self.op == 'DELETE'
        return bfile == 'b/' + self.path

    def ispatching(self, afile, bfile):
        """True when this metadata describes the afile -> bfile patch."""
        return self._ispatchinga(afile) and self._ispatchingb(bfile)

    def __repr__(self):
        return "<patchmeta %s %r>" % (self.op, self.path)
366 367
def readgitpatch(lr):
    """extract git-style metadata about patches from <patchname>

    Returns a list of patchmeta objects, one per file touched, built from
    the git extended header lines (rename/copy/mode/binary markers).
    """

    # Filter patch for git information
    gp = None
    gitpatches = []
    for line in lr:
        line = line.rstrip(' \r\n')
        if line.startswith('diff --git a/'):
            m = gitre.match(line)
            if m:
                # A new file entry begins; flush the previous one.
                if gp:
                    gitpatches.append(gp)
                dst = m.group(2)
                gp = patchmeta(dst)
        elif gp:
            if line.startswith('--- '):
                # Hunks start here: metadata for this file is complete.
                gitpatches.append(gp)
                gp = None
                continue
            if line.startswith('rename from '):
                gp.op = 'RENAME'
                gp.oldpath = line[12:]
            elif line.startswith('rename to '):
                gp.path = line[10:]
            elif line.startswith('copy from '):
                gp.op = 'COPY'
                gp.oldpath = line[10:]
            elif line.startswith('copy to '):
                gp.path = line[8:]
            elif line.startswith('deleted file'):
                gp.op = 'DELETE'
            elif line.startswith('new file mode '):
                gp.op = 'ADD'
                gp.setmode(int(line[-6:], 8))
            elif line.startswith('new mode '):
                gp.setmode(int(line[-6:], 8))
            elif line.startswith('GIT binary patch'):
                gp.binary = True
    if gp:
        gitpatches.append(gp)

    return gitpatches
410 411
class linereader(object):
    """Line reader that allows pushing lines back onto the input stream."""

    def __init__(self, fp):
        self.fp = fp
        # LIFO-pushed, FIFO-consumed queue of pushed-back lines.
        self.buf = []

    def push(self, line):
        """Queue *line* to be returned by the next readline() call."""
        if line is not None:
            self.buf.append(line)

    def readline(self):
        """Return the oldest pushed-back line, else read from the stream."""
        if self.buf:
            return self.buf.pop(0)
        return self.fp.readline()

    def __iter__(self):
        # Iterate until readline() returns the empty string.
        return iter(self.readline, '')
430 431
class abstractbackend(object):
    """Abstract destination for applying a patch (filesystem, repo, ...)."""

    def __init__(self, ui):
        self.ui = ui

    def getfile(self, fname):
        """Return target file data and flags as a (data, (islink,
        isexec)) tuple. Data is None if file is missing/deleted.
        """
        raise NotImplementedError

    def setfile(self, fname, data, mode, copysource):
        """Write data to target file fname and set its mode. mode is a
        (islink, isexec) tuple. If data is None, the file content should
        be left unchanged. If the file is modified after being copied,
        copysource is set to the original file name.
        """
        raise NotImplementedError

    def unlink(self, fname):
        """Unlink target file."""
        raise NotImplementedError

    def writerej(self, fname, failed, total, lines):
        """Write rejected lines for fname. failed is the number of hunks
        which failed to apply and total the total number of hunks for this
        file.
        """
        # Intentionally a no-op by default: backends that cannot persist
        # reject files silently drop them.

    def exists(self, fname):
        raise NotImplementedError

    def close(self):
        raise NotImplementedError
464 465
class fsbackend(abstractbackend):
    """Patch backend reading and writing files beneath a base directory."""

    def __init__(self, ui, basedir):
        super(fsbackend, self).__init__(ui)
        self.opener = vfsmod.vfs(basedir)

    def getfile(self, fname):
        """Return (data, (islink, isexec)); (None, None) when missing."""
        if self.opener.islink(fname):
            # For a symlink the "data" is the link target itself.
            return (self.opener.readlink(fname), (True, False))

        isexec = False
        try:
            isexec = self.opener.lstat(fname).st_mode & 0o100 != 0
        except OSError as err:
            if err.errno != errno.ENOENT:
                raise
        try:
            return (self.opener.read(fname), (False, isexec))
        except IOError as err:
            if err.errno != errno.ENOENT:
                raise
        return None, None

    def setfile(self, fname, data, mode, copysource):
        islink, isexec = mode
        if data is None:
            # Content unchanged: only the flags need updating.
            self.opener.setflags(fname, islink, isexec)
            return
        if islink:
            self.opener.symlink(data, fname)
        else:
            self.opener.write(fname, data)
            if isexec:
                self.opener.setflags(fname, False, True)

    def unlink(self, fname):
        # Optionally prune directories left empty by the removal.
        rmdir = self.ui.configbool('experimental', 'removeemptydirs')
        self.opener.unlinkpath(fname, ignoremissing=True, rmdir=rmdir)

    def writerej(self, fname, failed, total, lines):
        """Save rejected hunks next to the target as '<fname>.rej'."""
        rejname = fname + ".rej"
        self.ui.warn(
            _("%d out of %d hunks FAILED -- saving rejects to file %s\n") %
            (failed, total, rejname))
        rejfp = self.opener(rejname, 'w')
        rejfp.writelines(lines)
        rejfp.close()

    def exists(self, fname):
        return self.opener.lexists(fname)
514 515
class workingbackend(fsbackend):
    """fsbackend that also keeps the repo dirstate in sync with changes."""

    def __init__(self, ui, repo, similarity):
        super(workingbackend, self).__init__(ui, repo.root)
        self.repo = repo
        # Similarity threshold forwarded to scmutil.marktouched() so
        # add/remove pairs can be detected as renames.
        self.similarity = similarity
        self.removed = set()
        self.changed = set()
        self.copied = []

    def _checkknown(self, fname):
        # '?' means unknown to the dirstate: refuse to clobber such files.
        if self.repo.dirstate[fname] == '?' and self.exists(fname):
            raise PatchError(_('cannot patch %s: file is not tracked') % fname)

    def setfile(self, fname, data, mode, copysource):
        self._checkknown(fname)
        super(workingbackend, self).setfile(fname, data, mode, copysource)
        if copysource is not None:
            self.copied.append((copysource, fname))
        self.changed.add(fname)

    def unlink(self, fname):
        self._checkknown(fname)
        super(workingbackend, self).unlink(fname)
        self.removed.add(fname)
        self.changed.add(fname)

    def close(self):
        """Record copies/removals in the dirstate; return changed files."""
        wctx = self.repo[None]
        changed = set(self.changed)
        for src, dst in self.copied:
            scmutil.dirstatecopy(self.ui, self.repo, wctx, src, dst)
        if self.removed:
            wctx.forget(sorted(self.removed))
            for f in self.removed:
                if f not in self.repo.dirstate:
                    # File was deleted and no longer belongs to the
                    # dirstate, it was probably marked added then
                    # deleted, and should not be considered by
                    # marktouched().
                    changed.discard(f)
        if changed:
            scmutil.marktouched(self.repo, changed, self.similarity)
        return sorted(self.changed)
558 559
class filestore(object):
    """Keep file contents in memory, spilling to a temp dir past maxsize."""

    def __init__(self, maxsize=None):
        self.opener = None
        self.files = {}
        self.created = 0
        # Default in-memory budget is 4 MiB; a negative maxsize means
        # "never spill to disk".
        self.maxsize = 4 * (2 ** 20) if maxsize is None else maxsize
        self.size = 0
        self.data = {}

    def setfile(self, fname, data, mode, copied=None):
        """Record (data, mode, copied) for fname."""
        if self.maxsize < 0 or (len(data) + self.size) <= self.maxsize:
            # Fits in the in-memory budget.
            self.data[fname] = (data, mode, copied)
            self.size += len(data)
            return
        # Spill to an on-disk temp directory, created lazily.
        if self.opener is None:
            root = pycompat.mkdtemp(prefix='hg-patch-')
            self.opener = vfsmod.vfs(root)
        # Avoid filename issues with these simple names
        fn = '%d' % self.created
        self.opener.write(fn, data)
        self.created += 1
        self.files[fname] = (fn, mode, copied)

    def getfile(self, fname):
        """Return (data, mode, copied) for fname, or (None, None, None)."""
        try:
            return self.data[fname]
        except KeyError:
            pass
        if not self.opener or fname not in self.files:
            return None, None, None
        fn, mode, copied = self.files[fname]
        return self.opener.read(fn), mode, copied

    def close(self):
        # Remove the spill directory, if one was ever created.
        if self.opener:
            shutil.rmtree(self.opener.base)
595 596
class repobackend(abstractbackend):
    """Patch backend applying changes against a changectx via a filestore."""

    def __init__(self, ui, repo, ctx, store):
        super(repobackend, self).__init__(ui)
        self.repo = repo
        self.ctx = ctx
        self.store = store
        self.changed = set()
        self.removed = set()
        self.copied = {}

    def _checkknown(self, fname):
        # Refuse to touch files the base context does not track.
        if fname not in self.ctx:
            raise PatchError(_('cannot patch %s: file is not tracked') % fname)

    def getfile(self, fname):
        """Return (data, (islink, isexec)); (None, None) when missing."""
        try:
            fctx = self.ctx[fname]
        except error.LookupError:
            return None, None
        flags = fctx.flags()
        islink, isexec = 'l' in flags, 'x' in flags
        return fctx.data(), (islink, isexec)

    def setfile(self, fname, data, mode, copysource):
        if copysource:
            self._checkknown(copysource)
        if data is None:
            # Flags-only change: reuse the current content.
            data = self.ctx[fname].data()
        self.store.setfile(fname, data, mode, copysource)
        self.changed.add(fname)
        if copysource:
            self.copied[fname] = copysource

    def unlink(self, fname):
        self._checkknown(fname)
        self.removed.add(fname)

    def exists(self, fname):
        return fname in self.ctx

    def close(self):
        # Report every file this backend touched.
        return self.changed | self.removed
637 638
# @@ -start,len +start,len @@ or @@ -start +start @@ if len is 1
# Raw string literals: '\d', '\+' and '\*' are invalid escape sequences in
# plain literals (DeprecationWarning since Python 3.6, later an error),
# even though re receives the same pattern either way.
unidesc = re.compile(r'@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@')
contextdesc = re.compile(r'(?:---|\*\*\*) (\d+)(?:,(\d+))? (?:---|\*\*\*)')
# Supported end-of-line normalization modes for patched files.
eolmodes = ['strict', 'crlf', 'lf', 'auto']
642 643
class patchfile(object):
    """State and logic for applying hunks to a single patched file.

    'gp' is the patchmeta describing the operation, 'backend' the
    destination, 'store' a filestore holding copy/rename sources, and
    'eolmode' one of the eolmodes values controlling EOL normalization.
    """
    def __init__(self, ui, gp, backend, store, eolmode='strict'):
        self.fname = gp.path
        self.eolmode = eolmode
        self.eol = None
        self.backend = backend
        self.ui = ui
        self.lines = []
        self.exists = False
        self.missing = True
        self.mode = gp.mode
        self.copysource = gp.oldpath
        self.create = gp.op in ('ADD', 'COPY', 'RENAME')
        self.remove = gp.op == 'DELETE'
        # Copies/renames read their base content from the store, plain
        # modifications from the backend.
        if self.copysource is None:
            data, mode = backend.getfile(self.fname)
        else:
            data, mode = store.getfile(self.copysource)[:2]
        if data is not None:
            self.exists = self.copysource is None or backend.exists(self.fname)
            self.missing = False
            if data:
                self.lines = mdiff.splitnewlines(data)
            if self.mode is None:
                self.mode = mode
            if self.lines:
                # Normalize line endings
                if self.lines[0].endswith('\r\n'):
                    self.eol = '\r\n'
                elif self.lines[0].endswith('\n'):
                    self.eol = '\n'
                if eolmode != 'strict':
                    nlines = []
                    for l in self.lines:
                        if l.endswith('\r\n'):
                            l = l[:-2] + '\n'
                        nlines.append(l)
                    self.lines = nlines
        else:
            if self.create:
                self.missing = False
            if self.mode is None:
                self.mode = (False, False)
        if self.missing:
            self.ui.warn(_("unable to find '%s' for patching\n") % self.fname)
            self.ui.warn(_("(use '--prefix' to apply patch relative to the "
                           "current directory)\n"))

        self.hash = {}
        self.dirty = 0
        self.offset = 0
        self.skew = 0
        self.rej = []
        self.fileprinted = False
        self.printfile(False)
        self.hunks = 0

    def writelines(self, fname, lines, mode):
        """Write lines to the backend, converting EOLs per self.eolmode."""
        if self.eolmode == 'auto':
            eol = self.eol
        elif self.eolmode == 'crlf':
            eol = '\r\n'
        else:
            eol = '\n'

        if self.eolmode != 'strict' and eol and eol != '\n':
            rawlines = []
            for l in lines:
                if l and l.endswith('\n'):
                    l = l[:-1] + eol
                rawlines.append(l)
            lines = rawlines

        self.backend.setfile(fname, ''.join(lines), mode, self.copysource)

    def printfile(self, warn):
        """Emit "patching file ..." at most once, as a warning or a note."""
        if self.fileprinted:
            return
        if warn or self.ui.verbose:
            self.fileprinted = True
        s = _("patching file %s\n") % self.fname
        if warn:
            self.ui.warn(s)
        else:
            self.ui.note(s)


    def findlines(self, l, linenum):
        # looks through the hash and finds candidate lines. The
        # result is a list of line numbers sorted based on distance
        # from linenum

        cand = self.hash.get(l, [])
        if len(cand) > 1:
            # resort our list of potentials forward then back.
            cand.sort(key=lambda x: abs(x - linenum))
        return cand

    def write_rej(self):
        # our rejects are a little different from patch(1). This always
        # creates rejects in the same form as the original patch. A file
        # header is inserted so that you can run the reject through patch again
        # without having to type the filename.
        if not self.rej:
            return
        base = os.path.basename(self.fname)
        lines = ["--- %s\n+++ %s\n" % (base, base)]
        for x in self.rej:
            for l in x.hunk:
                lines.append(l)
                if l[-1:] != '\n':
                    lines.append("\n\ No newline at end of file\n")
        self.backend.writerej(self.fname, len(self.rej), self.hunks, lines)

    def apply(self, h):
        """Apply hunk h.

        Returns 0 on a clean apply, the fuzz level used on a fuzzy apply,
        or -1 when the hunk was rejected (recorded in self.rej).
        """
        if not h.complete():
            raise PatchError(_("bad hunk #%d %s (%d %d %d %d)") %
                             (h.number, h.desc, len(h.a), h.lena, len(h.b),
                              h.lenb))

        self.hunks += 1

        if self.missing:
            self.rej.append(h)
            return -1

        if self.exists and self.create:
            if self.copysource:
                self.ui.warn(_("cannot create %s: destination already "
                               "exists\n") % self.fname)
            else:
                self.ui.warn(_("file %s already exists\n") % self.fname)
            self.rej.append(h)
            return -1

        if isinstance(h, binhunk):
            # Binary hunks replace the file content wholesale.
            if self.remove:
                self.backend.unlink(self.fname)
            else:
                l = h.new(self.lines)
                self.lines[:] = l
                self.offset += len(l)
                self.dirty = True
            return 0

        horig = h
        if (self.eolmode in ('crlf', 'lf')
            or self.eolmode == 'auto' and self.eol):
            # If new eols are going to be normalized, then normalize
            # hunk data before patching. Otherwise, preserve input
            # line-endings.
            h = h.getnormalized()

        # fast case first, no offsets, no fuzz
        old, oldstart, new, newstart = h.fuzzit(0, False)
        oldstart += self.offset
        orig_start = oldstart
        # if there's skew we want to emit the "(offset %d lines)" even
        # when the hunk cleanly applies at start + skew, so skip the
        # fast case code
        if self.skew == 0 and diffhelper.testhunk(old, self.lines, oldstart):
            if self.remove:
                self.backend.unlink(self.fname)
            else:
                self.lines[oldstart:oldstart + len(old)] = new
                self.offset += len(new) - len(old)
                self.dirty = True
            return 0

        # ok, we couldn't match the hunk. Lets look for offsets and fuzz it
        self.hash = {}
        for x, s in enumerate(self.lines):
            self.hash.setdefault(s, []).append(x)

        # NOTE(review): bare `xrange` -- this module targets Python 2;
        # presumably hg's py3 source transformer rewrites it. Verify.
        for fuzzlen in xrange(self.ui.configint("patch", "fuzz") + 1):
            for toponly in [True, False]:
                old, oldstart, new, newstart = h.fuzzit(fuzzlen, toponly)
                oldstart = oldstart + self.offset + self.skew
                oldstart = min(oldstart, len(self.lines))
                if old:
                    cand = self.findlines(old[0][1:], oldstart)
                else:
                    # Only adding lines with no or fuzzed context, just
                    # take the skew in account
                    cand = [oldstart]

                for l in cand:
                    if not old or diffhelper.testhunk(old, self.lines, l):
                        self.lines[l : l + len(old)] = new
                        self.offset += len(new) - len(old)
                        self.skew = l - orig_start
                        self.dirty = True
                        offset = l - orig_start - fuzzlen
                        if fuzzlen:
                            msg = _("Hunk #%d succeeded at %d "
                                    "with fuzz %d "
                                    "(offset %d lines).\n")
                            self.printfile(True)
                            self.ui.warn(msg %
                                (h.number, l + 1, fuzzlen, offset))
                        else:
                            msg = _("Hunk #%d succeeded at %d "
                                    "(offset %d lines).\n")
                            self.ui.note(msg % (h.number, l + 1, offset))
                        return fuzzlen
        self.printfile(True)
        self.ui.warn(_("Hunk #%d FAILED at %d\n") % (h.number, orig_start))
        self.rej.append(horig)
        return -1

    def close(self):
        """Flush pending changes and rejects; return the reject count."""
        if self.dirty:
            self.writelines(self.fname, self.lines, self.mode)
        self.write_rej()
        return len(self.rej)
858 859
class header(object):
    """patch header

    Wraps the raw header lines of one file's diff and answers questions
    about them (binary? new file? special?).
    """
    diffgit_re = re.compile('diff --git a/(.*) b/(.*)$')
    diff_re = re.compile('diff -r .* (.*)$')
    allhunks_re = re.compile('(?:index|deleted file) ')
    pretty_re = re.compile('(?:new file|deleted file) ')
    special_re = re.compile('(?:index|deleted|copy|rename) ')
    newfile_re = re.compile('(?:new file)')

    def __init__(self, header):
        self.header = header
        self.hunks = []

    def binary(self):
        """True when an 'index ' line marks this as binary content."""
        return any(h.startswith('index ') for h in self.header)

    def pretty(self, fp):
        for h in self.header:
            if h.startswith('index '):
                fp.write(_('this modifies a binary file (all or nothing)\n'))
                break
            if self.pretty_re.match(h):
                fp.write(h)
                if self.binary():
                    fp.write(_('this is a binary file\n'))
                break
            if h.startswith('---'):
                fp.write(_('%d hunks, %d lines changed\n') %
                         (len(self.hunks),
                          sum([max(h.added, h.removed) for h in self.hunks])))
                break
            fp.write(h)

    def write(self, fp):
        fp.write(''.join(self.header))

    def allhunks(self):
        """True when hunks cannot be cherry-picked (binary/deleted file)."""
        return any(self.allhunks_re.match(h) for h in self.header)

    def files(self):
        """Return the file path(s) named by the first header line."""
        m = self.diffgit_re.match(self.header[0])
        if not m:
            return self.diff_re.match(self.header[0]).groups()
        fromfile, tofile = m.groups()
        return [fromfile] if fromfile == tofile else [fromfile, tofile]

    def filename(self):
        return self.files()[-1]

    def __repr__(self):
        return '<header %s>' % (' '.join(map(repr, self.files())))

    def isnewfile(self):
        return any(self.newfile_re.match(h) for h in self.header)

    def special(self):
        # Special files are shown only at the header level and not at the hunk
        # level for example a file that has been deleted is a special file.
        # The user cannot change the content of the operation, in the case of
        # the deleted file he has to take the deletion or not take it, he
        # cannot take some of it.
        # Newly added files are special if they are empty, they are not special
        # if they have some content as we want to be able to change it
        nocontent = len(self.header) == 2
        emptynewfile = self.isnewfile() and nocontent
        return emptynewfile or any(self.special_re.match(h)
                                   for h in self.header)
930 931
931 932 class recordhunk(object):
932 933 """patch hunk
933 934
934 935 XXX shouldn't we merge this with the other hunk class?
935 936 """
936 937
937 938 def __init__(self, header, fromline, toline, proc, before, hunk, after,
938 939 maxcontext=None):
939 940 def trimcontext(lines, reverse=False):
940 941 if maxcontext is not None:
941 942 delta = len(lines) - maxcontext
942 943 if delta > 0:
943 944 if reverse:
944 945 return delta, lines[delta:]
945 946 else:
946 947 return delta, lines[:maxcontext]
947 948 return 0, lines
948 949
949 950 self.header = header
950 951 trimedbefore, self.before = trimcontext(before, True)
951 952 self.fromline = fromline + trimedbefore
952 953 self.toline = toline + trimedbefore
953 954 _trimedafter, self.after = trimcontext(after, False)
954 955 self.proc = proc
955 956 self.hunk = hunk
956 957 self.added, self.removed = self.countchanges(self.hunk)
957 958
958 959 def __eq__(self, v):
959 960 if not isinstance(v, recordhunk):
960 961 return False
961 962
962 963 return ((v.hunk == self.hunk) and
963 964 (v.proc == self.proc) and
964 965 (self.fromline == v.fromline) and
965 966 (self.header.files() == v.header.files()))
966 967
967 968 def __hash__(self):
968 969 return hash((tuple(self.hunk),
969 970 tuple(self.header.files()),
970 971 self.fromline,
971 972 self.proc))
972 973
973 974 def countchanges(self, hunk):
974 975 """hunk -> (n+,n-)"""
975 976 add = len([h for h in hunk if h.startswith('+')])
976 977 rem = len([h for h in hunk if h.startswith('-')])
977 978 return add, rem
978 979
979 980 def reversehunk(self):
980 981 """return another recordhunk which is the reverse of the hunk
981 982
982 983 If this hunk is diff(A, B), the returned hunk is diff(B, A). To do
983 984 that, swap fromline/toline and +/- signs while keep other things
984 985 unchanged.
985 986 """
986 987 m = {'+': '-', '-': '+', '\\': '\\'}
987 988 hunk = ['%s%s' % (m[l[0:1]], l[1:]) for l in self.hunk]
988 989 return recordhunk(self.header, self.toline, self.fromline, self.proc,
989 990 self.before, hunk, self.after)
990 991
991 992 def write(self, fp):
992 993 delta = len(self.before) + len(self.after)
993 994 if self.after and self.after[-1] == '\\ No newline at end of file\n':
994 995 delta -= 1
995 996 fromlen = delta + self.removed
996 997 tolen = delta + self.added
997 998 fp.write('@@ -%d,%d +%d,%d @@%s\n' %
998 999 (self.fromline, fromlen, self.toline, tolen,
999 1000 self.proc and (' ' + self.proc)))
1000 1001 fp.write(''.join(self.before + self.hunk + self.after))
1001 1002
1002 1003 pretty = write
1003 1004
    def filename(self):
        # the file this hunk applies to, as reported by its header
        return self.header.filename()
1006 1007
    def __repr__(self):
        # e.g. <hunk 'foo/bar.py'@42>
        return '<hunk %r@%d>' % (self.filename(), self.fromline)
1009 1010
def getmessages():
    """Return the interactive prompt strings used by filterpatch.

    The mapping is keyed by 'multiple'/'single' (how many hunks are being
    reviewed) or 'help', then by the operation name ('apply', 'discard'
    or 'record').  The 'help' entries use ui.promptchoice()'s
    '$$'-separated choice syntax.
    """
    return {
        'multiple': {
            'apply': _("apply change %d/%d to '%s'?"),
            'discard': _("discard change %d/%d to '%s'?"),
            'record': _("record change %d/%d to '%s'?"),
        },
        'single': {
            'apply': _("apply this change to '%s'?"),
            'discard': _("discard this change to '%s'?"),
            'record': _("record this change to '%s'?"),
        },
        'help': {
            'apply': _('[Ynesfdaq?]'
                       '$$ &Yes, apply this change'
                       '$$ &No, skip this change'
                       '$$ &Edit this change manually'
                       '$$ &Skip remaining changes to this file'
                       '$$ Apply remaining changes to this &file'
                       '$$ &Done, skip remaining changes and files'
                       '$$ Apply &all changes to all remaining files'
                       '$$ &Quit, applying no changes'
                       '$$ &? (display help)'),
            'discard': _('[Ynesfdaq?]'
                         '$$ &Yes, discard this change'
                         '$$ &No, skip this change'
                         '$$ &Edit this change manually'
                         '$$ &Skip remaining changes to this file'
                         '$$ Discard remaining changes to this &file'
                         '$$ &Done, skip remaining changes and files'
                         '$$ Discard &all changes to all remaining files'
                         '$$ &Quit, discarding no changes'
                         '$$ &? (display help)'),
            'record': _('[Ynesfdaq?]'
                        '$$ &Yes, record this change'
                        '$$ &No, skip this change'
                        '$$ &Edit this change manually'
                        '$$ &Skip remaining changes to this file'
                        '$$ Record remaining changes to this &file'
                        '$$ &Done, skip remaining changes and files'
                        '$$ Record &all changes to all remaining files'
                        '$$ &Quit, recording no changes'
                        '$$ &? (display help)'),
        }
    }
1055 1056
def filterpatch(ui, headers, operation=None):
    """Interactively filter patch chunks into applied-only chunks

    headers is a list of header objects, each carrying its hunks.
    operation selects the prompt wording (defaults to 'record').
    Returns a 2-tuple: (flat list of kept headers and hunks, {}).
    """
    messages = getmessages()

    if operation is None:
        operation = 'record'

    def prompt(skipfile, skipall, query, chunk):
        """prompt query, and process base inputs

        - y/n for the rest of file
        - y/n for the rest
        - ? (help)
        - q (quit)

        Return True/False and possibly updated skipfile and skipall.
        """
        newpatches = None
        # a previous 'file'/'all' answer short-circuits further prompting
        if skipall is not None:
            return skipall, skipfile, skipall, newpatches
        if skipfile is not None:
            return skipfile, skipfile, skipall, newpatches
        while True:
            resps = messages['help'][operation]
            r = ui.promptchoice("%s %s" % (query, resps))
            ui.write("\n")
            if r == 8: # ?
                for c, t in ui.extractchoices(resps)[1]:
                    ui.write('%s - %s\n' % (c, encoding.lower(t)))
                continue
            elif r == 0: # yes
                ret = True
            elif r == 1: # no
                ret = False
            elif r == 2: # Edit patch
                if chunk is None:
                    ui.write(_('cannot edit patch for whole file'))
                    ui.write("\n")
                    continue
                if chunk.header.binary():
                    ui.write(_('cannot edit patch for binary file'))
                    ui.write("\n")
                    continue
                # Patch comment based on the Git one (based on comment at end of
                # https://mercurial-scm.org/wiki/RecordExtension)
                phelp = '---' + _("""
To remove '-' lines, make them ' ' lines (context).
To remove '+' lines, delete them.
Lines starting with # will be removed from the patch.

If the patch applies cleanly, the edited hunk will immediately be
added to the record list. If it does not apply cleanly, a rejects
file will be generated: you can use that when you try again. If
all lines of the hunk are removed, then the edit is aborted and
the hunk is left unchanged.
""")
                (patchfd, patchfn) = pycompat.mkstemp(prefix="hg-editor-",
                                                      suffix=".diff")
                ncpatchfp = None
                try:
                    # Write the initial patch
                    f = util.nativeeolwriter(os.fdopen(patchfd, r'wb'))
                    chunk.header.write(f)
                    chunk.write(f)
                    f.write('\n'.join(['# ' + i for i in phelp.splitlines()]))
                    f.close()
                    # Start the editor and wait for it to complete
                    editor = ui.geteditor()
                    ret = ui.system("%s \"%s\"" % (editor, patchfn),
                                    environ={'HGUSER': ui.username()},
                                    blockedtag='filterpatch')
                    if ret != 0:
                        ui.warn(_("editor exited with exit code %d\n") % ret)
                        continue
                    # Remove comment lines
                    patchfp = open(patchfn, r'rb')
                    ncpatchfp = stringio()
                    for line in util.iterfile(patchfp):
                        line = util.fromnativeeol(line)
                        if not line.startswith('#'):
                            ncpatchfp.write(line)
                    patchfp.close()
                    ncpatchfp.seek(0)
                    newpatches = parsepatch(ncpatchfp)
                finally:
                    os.unlink(patchfn)
                    del ncpatchfp
                # Signal that the chunk shouldn't be applied as-is, but
                # provide the new patch to be used instead.
                ret = False
            elif r == 3: # Skip
                ret = skipfile = False
            elif r == 4: # file (Record remaining)
                ret = skipfile = True
            elif r == 5: # done, skip remaining
                ret = skipall = False
            elif r == 6: # all
                ret = skipall = True
            elif r == 7: # quit
                raise error.Abort(_('user quit'))
            return ret, skipfile, skipall, newpatches

    seen = set()
    applied = {} # 'filename' -> [] of chunks
    skipfile, skipall = None, None
    pos, total = 1, sum(len(h.hunks) for h in headers)
    for h in headers:
        pos += len(h.hunks)
        skipfile = None
        # fixoffset tracks how much the new-side line numbers of later
        # hunks in this file shift when earlier hunks are not applied
        fixoffset = 0
        hdr = ''.join(h.header)
        if hdr in seen:
            continue
        seen.add(hdr)
        if skipall is None:
            h.pretty(ui)
        msg = (_('examine changes to %s?') %
               _(' and ').join("'%s'" % f for f in h.files()))
        r, skipfile, skipall, np = prompt(skipfile, skipall, msg, None)
        if not r:
            continue
        applied[h.filename()] = [h]
        if h.allhunks():
            applied[h.filename()] += h.hunks
            continue
        for i, chunk in enumerate(h.hunks):
            if skipfile is None and skipall is None:
                chunk.pretty(ui)
            if total == 1:
                msg = messages['single'][operation] % chunk.filename()
            else:
                idx = pos - len(h.hunks) + i
                msg = messages['multiple'][operation] % (idx, total,
                                                         chunk.filename())
            r, skipfile, skipall, newpatches = prompt(skipfile,
                                                      skipall, msg, chunk)
            if r:
                if fixoffset:
                    # copy before mutating so the original hunk is untouched
                    chunk = copy.copy(chunk)
                    chunk.toline += fixoffset
                applied[chunk.filename()].append(chunk)
            elif newpatches is not None:
                for newpatch in newpatches:
                    for newhunk in newpatch.hunks:
                        if fixoffset:
                            newhunk.toline += fixoffset
                        applied[newhunk.filename()].append(newhunk)
            else:
                fixoffset += chunk.removed - chunk.added
    # keep only entries whose header is special or that got at least one
    # hunk selected (the header itself is always element 0)
    return (sum([h for h in applied.itervalues()
                 if h[0].special() or len(h) > 1], []), {})
class hunk(object):
    """One hunk of a unified or context diff.

    Parses itself from the linereader 'lr' at construction time.  After
    parsing, 'a' holds the old-side lines, 'b' the new-side lines, and
    (starta, lena) / (startb, lenb) the ranges from the hunk header.
    """
    def __init__(self, desc, num, lr, context):
        # desc: the '@@ ...' (or context diff) descriptor line
        # num: 1-based hunk number, used in error messages
        # lr: linereader to parse from, or None for a shell object
        # context: True for context-diff format, False for unified
        self.number = num
        self.desc = desc
        self.hunk = [desc]
        self.a = []
        self.b = []
        self.starta = self.lena = None
        self.startb = self.lenb = None
        if lr is not None:
            if context:
                self.read_context_hunk(lr)
            else:
                self.read_unified_hunk(lr)

    def getnormalized(self):
        """Return a copy with line endings normalized to LF."""

        def normalize(lines):
            nlines = []
            for line in lines:
                if line.endswith('\r\n'):
                    line = line[:-2] + '\n'
                nlines.append(line)
            return nlines

        # Dummy object, it is rebuilt manually
        nh = hunk(self.desc, self.number, None, None)
        nh.number = self.number
        nh.desc = self.desc
        nh.hunk = self.hunk
        nh.a = normalize(self.a)
        nh.b = normalize(self.b)
        nh.starta = self.starta
        nh.startb = self.startb
        nh.lena = self.lena
        nh.lenb = self.lenb
        return nh

    def read_unified_hunk(self, lr):
        # parse '@@ -starta,lena +startb,lenb @@' then the hunk body
        m = unidesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.starta, self.lena, self.startb, self.lenb = m.groups()
        # a missing length defaults to 1 per the unified diff format
        if self.lena is None:
            self.lena = 1
        else:
            self.lena = int(self.lena)
        if self.lenb is None:
            self.lenb = 1
        else:
            self.lenb = int(self.lenb)
        self.starta = int(self.starta)
        self.startb = int(self.startb)
        try:
            diffhelper.addlines(lr, self.hunk, self.lena, self.lenb,
                                self.a, self.b)
        except error.ParseError as e:
            raise PatchError(_("bad hunk #%d: %s") % (self.number, e))
        # if we hit eof before finishing out the hunk, the last line will
        # be zero length. Lets try to fix it up.
        while len(self.hunk[-1]) == 0:
            del self.hunk[-1]
            del self.a[-1]
            del self.b[-1]
            self.lena -= 1
            self.lenb -= 1
        self._fixnewline(lr)

    def read_context_hunk(self, lr):
        # first the '*** starta,aend ****' old-side section...
        self.desc = lr.readline()
        m = contextdesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.starta, aend = m.groups()
        self.starta = int(self.starta)
        if aend is None:
            aend = self.starta
        self.lena = int(aend) - self.starta
        if self.starta:
            self.lena += 1
        for x in xrange(self.lena):
            l = lr.readline()
            if l.startswith('---'):
                # lines addition, old block is empty
                lr.push(l)
                break
            s = l[2:]
            if l.startswith('- ') or l.startswith('! '):
                u = '-' + s
            elif l.startswith('  '):
                u = ' ' + s
            else:
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.a.append(u)
            self.hunk.append(u)

        l = lr.readline()
        if l.startswith('\ '):
            # '\ No newline at end of file': drop the trailing newline
            # we stored for the previous line
            s = self.a[-1][:-1]
            self.a[-1] = s
            self.hunk[-1] = s
            l = lr.readline()
        # ...then the '--- startb,bend ----' new-side section
        m = contextdesc.match(l)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.startb, bend = m.groups()
        self.startb = int(self.startb)
        if bend is None:
            bend = self.startb
        self.lenb = int(bend) - self.startb
        if self.startb:
            self.lenb += 1
        hunki = 1
        for x in xrange(self.lenb):
            l = lr.readline()
            if l.startswith('\ '):
                # XXX: the only way to hit this is with an invalid line range.
                # The no-eol marker is not counted in the line range, but I
                # guess there are diff(1) out there which behave differently.
                s = self.b[-1][:-1]
                self.b[-1] = s
                self.hunk[hunki - 1] = s
                continue
            if not l:
                # line deletions, new block is empty and we hit EOF
                lr.push(l)
                break
            s = l[2:]
            if l.startswith('+ ') or l.startswith('! '):
                u = '+' + s
            elif l.startswith('  '):
                u = ' ' + s
            elif len(self.b) == 0:
                # line deletions, new block is empty
                lr.push(l)
                break
            else:
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.b.append(s)
            # merge this new-side line into self.hunk at the right spot,
            # skipping over old-side '-' lines already recorded there
            while True:
                if hunki >= len(self.hunk):
                    h = ""
                else:
                    h = self.hunk[hunki]
                hunki += 1
                if h == u:
                    break
                elif h.startswith('-'):
                    continue
                else:
                    self.hunk.insert(hunki - 1, u)
                    break

        if not self.a:
            # this happens when lines were only added to the hunk
            for x in self.hunk:
                if x.startswith('-') or x.startswith(' '):
                    self.a.append(x)
        if not self.b:
            # this happens when lines were only deleted from the hunk
            for x in self.hunk:
                if x.startswith('+') or x.startswith(' '):
                    self.b.append(x[1:])
        # @@ -start,len +start,len @@
        self.desc = "@@ -%d,%d +%d,%d @@\n" % (self.starta, self.lena,
                                               self.startb, self.lenb)
        self.hunk[0] = self.desc
        self._fixnewline(lr)

    def _fixnewline(self, lr):
        # consume a trailing '\ No newline at end of file' marker, if any
        l = lr.readline()
        if l.startswith('\ '):
            diffhelper.fixnewline(self.hunk, self.a, self.b)
        else:
            lr.push(l)

    def complete(self):
        # True when both sides hold as many lines as their header claims
        return len(self.a) == self.lena and len(self.b) == self.lenb

    def _fuzzit(self, old, new, fuzz, toponly):
        # this removes context lines from the top and bottom of list 'l'. It
        # checks the hunk to make sure only context lines are removed, and then
        # returns a new shortened list of lines.
        fuzz = min(fuzz, len(old))
        if fuzz:
            top = 0
            bot = 0
            hlen = len(self.hunk)
            for x in xrange(hlen - 1):
                # the hunk starts with the @@ line, so use x+1
                if self.hunk[x + 1].startswith(' '):
                    top += 1
                else:
                    break
            if not toponly:
                for x in xrange(hlen - 1):
                    if self.hunk[hlen - bot - 1].startswith(' '):
                        bot += 1
                    else:
                        break

            bot = min(fuzz, bot)
            top = min(fuzz, top)
            return old[top:len(old) - bot], new[top:len(new) - bot], top
        return old, new, 0

    def fuzzit(self, fuzz, toponly):
        # return (old lines, old start, new lines, new start) with up to
        # 'fuzz' context lines trimmed from each end
        old, new, top = self._fuzzit(self.a, self.b, fuzz, toponly)
        oldstart = self.starta + top
        newstart = self.startb + top
        # zero length hunk ranges already have their start decremented
        if self.lena and oldstart > 0:
            oldstart -= 1
        if self.lenb and newstart > 0:
            newstart -= 1
        return old, oldstart, new, newstart
1426 1427
class binhunk(object):
    'A binary patch file.'
    # Parses a git binary patch hunk: a 'literal N' or 'delta N' size
    # line followed by base85-encoded, zlib-compressed payload lines.
    def __init__(self, lr, fname):
        self.text = None        # decoded payload, None until _read succeeds
        self.delta = False      # True for the 'delta' flavor
        self.hunk = ['GIT binary patch\n']
        self._fname = fname
        self._read(lr)

    def complete(self):
        return self.text is not None

    def new(self, lines):
        # return the new file content; for a delta, apply it to the
        # original content given in 'lines'
        if self.delta:
            return [applybindelta(self.text, ''.join(lines))]
        return [self.text]

    def _read(self, lr):
        def getline(lr, hunk):
            # read one raw line, record it in the hunk, return it stripped
            l = lr.readline()
            hunk.append(l)
            return l.rstrip('\r\n')

        size = 0
        while True:
            line = getline(lr, self.hunk)
            if not line:
                raise PatchError(_('could not extract "%s" binary data')
                                 % self._fname)
            if line.startswith('literal '):
                size = int(line[8:].rstrip())
                break
            if line.startswith('delta '):
                size = int(line[6:].rstrip())
                self.delta = True
                break
        dec = []
        line = getline(lr, self.hunk)
        while len(line) > 1:
            # each payload line starts with a letter encoding how many
            # bytes it decodes to: 'A'-'Z' -> 1..26, 'a'-'z' -> 27..52
            l = line[0:1]
            if l <= 'Z' and l >= 'A':
                l = ord(l) - ord('A') + 1
            else:
                l = ord(l) - ord('a') + 27
            try:
                dec.append(util.b85decode(line[1:])[:l])
            except ValueError as e:
                raise PatchError(_('could not decode "%s" binary patch: %s')
                                 % (self._fname, stringutil.forcebytestr(e)))
            line = getline(lr, self.hunk)
        text = zlib.decompress(''.join(dec))
        # the decompressed payload must match the advertised size
        if len(text) != size:
            raise PatchError(_('"%s" length is %d bytes, should be %d')
                             % (self._fname, len(text), size))
        self.text = text
1482 1483
def parsefilename(str):
    """Extract the file name from a '--- name<TAB-or-space>stuff' line."""
    # drop the '--- '/'+++ ' prefix and the line terminator
    name = str[4:].rstrip('\r\n')
    # the name ends at the first tab, or, failing that, the first space;
    # with neither present the whole remainder is the name
    for sep in ('\t', ' '):
        cut = name.find(sep)
        if cut >= 0:
            return name[:cut]
    return name
1492 1493
def reversehunks(hunks):
    '''reverse the signs in the hunks given as argument

    This function operates on hunks coming out of patch.filterpatch, that is
    a list of the form: [header1, hunk1, hunk2, header2...]. Example usage:

    >>> rawpatch = b"""diff --git a/folder1/g b/folder1/g
    ... --- a/folder1/g
    ... +++ b/folder1/g
    ... @@ -1,7 +1,7 @@
    ... +firstline
    ...  c
    ...  1
    ...  2
    ... + 3
    ... -4
    ...  5
    ...  d
    ... +lastline"""
    >>> hunks = parsepatch([rawpatch])
    >>> hunkscomingfromfilterpatch = []
    >>> for h in hunks:
    ...     hunkscomingfromfilterpatch.append(h)
    ...     hunkscomingfromfilterpatch.extend(h.hunks)

    >>> reversedhunks = reversehunks(hunkscomingfromfilterpatch)
    >>> from . import util
    >>> fp = util.stringio()
    >>> for c in reversedhunks:
    ...     c.write(fp)
    >>> fp.seek(0) or None
    >>> reversedpatch = fp.read()
    >>> print(pycompat.sysstr(reversedpatch))
    diff --git a/folder1/g b/folder1/g
    --- a/folder1/g
    +++ b/folder1/g
    @@ -1,4 +1,3 @@
    -firstline
     c
     1
     2
    @@ -2,6 +1,6 @@
     c
     1
     2
    - 3
    +4
     5
     d
    @@ -6,3 +5,2 @@
     5
     d
    -lastline

    '''

    # headers have no 'reversehunk' method and pass through unchanged;
    # every real hunk is replaced by its reverse
    return [c.reversehunk() if util.safehasattr(c, 'reversehunk') else c
            for c in hunks]
1555 1556
def parsepatch(originalchunks, maxcontext=None):
    """patch -> [] of headers -> [] of hunks

    If maxcontext is not None, trim context lines if necessary.

    >>> rawpatch = b'''diff --git a/folder1/g b/folder1/g
    ... --- a/folder1/g
    ... +++ b/folder1/g
    ... @@ -1,8 +1,10 @@
    ...  1
    ...  2
    ... -3
    ...  4
    ...  5
    ...  6
    ... +6.1
    ... +6.2
    ...  7
    ...  8
    ... +9'''
    >>> out = util.stringio()
    >>> headers = parsepatch([rawpatch], maxcontext=1)
    >>> for header in headers:
    ...     header.write(out)
    ...     for hunk in header.hunks:
    ...         hunk.write(out)
    >>> print(pycompat.sysstr(out.getvalue()))
    diff --git a/folder1/g b/folder1/g
    --- a/folder1/g
    +++ b/folder1/g
    @@ -2,3 +2,2 @@
     2
    -3
     4
    @@ -6,2 +5,4 @@
     6
    +6.1
    +6.2
     7
    @@ -8,1 +9,2 @@
     8
    +9
    """
    class parser(object):
        """patch parsing state machine"""
        def __init__(self):
            self.fromline = 0    # old-side line of the current hunk
            self.toline = 0      # new-side line of the current hunk
            self.proc = ''       # function context from the @@ line
            self.header = None   # header currently collecting hunks
            self.context = []    # pending context lines
            self.before = []     # context preceding the current hunk
            self.hunk = []       # pending changed lines
            self.headers = []    # completed headers

        def addrange(self, limits):
            fromstart, fromend, tostart, toend, proc = limits
            self.fromline = int(fromstart)
            self.toline = int(tostart)
            self.proc = proc

        def addcontext(self, context):
            # context lines close any pending hunk: materialize it
            if self.hunk:
                h = recordhunk(self.header, self.fromline, self.toline,
                        self.proc, self.before, self.hunk, context, maxcontext)
                self.header.hunks.append(h)
                self.fromline += len(self.before) + h.removed
                self.toline += len(self.before) + h.added
                self.before = []
                self.hunk = []
            self.context = context

        def addhunk(self, hunk):
            # context seen just before a hunk becomes its leading context
            if self.context:
                self.before = self.context
                self.context = []
            self.hunk = hunk

        def newfile(self, hdr):
            self.addcontext([])
            h = header(hdr)
            self.headers.append(h)
            self.header = h

        def addother(self, line):
            pass # 'other' lines are ignored

        def finished(self):
            # flush the last pending hunk and return all headers
            self.addcontext([])
            return self.headers

        # map (current state, event from scanpatch) -> handler; the
        # handlers are unbound here and called below as f(p, data)
        transitions = {
            'file': {'context': addcontext,
                     'file': newfile,
                     'hunk': addhunk,
                     'range': addrange},
            'context': {'file': newfile,
                        'hunk': addhunk,
                        'range': addrange,
                        'other': addother},
            'hunk': {'context': addcontext,
                     'file': newfile,
                     'range': addrange},
            'range': {'context': addcontext,
                      'hunk': addhunk},
            'other': {'other': addother},
        }

    p = parser()
    fp = stringio()
    fp.write(''.join(originalchunks))
    fp.seek(0)

    state = 'context'
    for newstate, data in scanpatch(fp):
        try:
            p.transitions[state][newstate](p, data)
        except KeyError:
            raise PatchError('unhandled transition: %s -> %s' %
                             (state, newstate))
        state = newstate
    del fp
    return p.finished()
1679 1680
def pathtransform(path, strip, prefix):
    '''turn a path from a patch into a path suitable for the repository

    prefix, if not empty, is expected to be normalized with a / at the end.

    Returns (stripped components, path in repository).

    >>> pathtransform(b'a/b/c', 0, b'')
    ('', 'a/b/c')
    >>> pathtransform(b'   a/b/c   ', 0, b'')
    ('', '   a/b/c')
    >>> pathtransform(b'   a/b/c   ', 2, b'')
    ('a/b/', 'c')
    >>> pathtransform(b'a/b/c', 0, b'd/e/')
    ('', 'd/e/a/b/c')
    >>> pathtransform(b'   a//b/c   ', 2, b'd/e/')
    ('a//b/', 'd/e/c')
    >>> pathtransform(b'a/b/c', 3, b'')
    Traceback (most recent call last):
    PatchError: unable to strip away 1 of 3 dirs from a/b/c
    '''
    if strip == 0:
        return '', prefix + path.rstrip()
    end = len(path)
    pos = 0
    remaining = strip
    while remaining > 0:
        pos = path.find('/', pos)
        if pos == -1:
            raise PatchError(_("unable to strip away %d of %d dirs from %s") %
                             (remaining, strip, path))
        pos += 1
        # consume '//' in the path
        while pos < end - 1 and path[pos:pos + 1] == '/':
            pos += 1
        remaining -= 1
    return path[:pos].lstrip(), prefix + path[pos:].rstrip()
1717 1718
def makepatchmeta(backend, afile_orig, bfile_orig, hunk, strip, prefix):
    """Build a patchmeta naming the file a plain-diff hunk applies to.

    Chooses between the '---' name (afile) and the '+++' name (bfile)
    based on /dev/null markers and on which side exists in the backend,
    and tags the result with op 'ADD' or 'DELETE' when the hunk creates
    or removes the file.  Raises PatchError when neither side yields a
    usable name.
    """
    nulla = afile_orig == "/dev/null"
    nullb = bfile_orig == "/dev/null"
    # a 0,0 range on the old (new) side marks a file creation (removal)
    create = nulla and hunk.starta == 0 and hunk.lena == 0
    remove = nullb and hunk.startb == 0 and hunk.lenb == 0
    abase, afile = pathtransform(afile_orig, strip, prefix)
    gooda = not nulla and backend.exists(afile)
    bbase, bfile = pathtransform(bfile_orig, strip, prefix)
    if afile == bfile:
        goodb = gooda
    else:
        goodb = not nullb and backend.exists(bfile)
    missing = not goodb and not gooda and not create

    # some diff programs apparently produce patches where the afile is
    # not /dev/null, but afile starts with bfile
    abasedir = afile[:afile.rfind('/') + 1]
    bbasedir = bfile[:bfile.rfind('/') + 1]
    if (missing and abasedir == bbasedir and afile.startswith(bfile)
        and hunk.starta == 0 and hunk.lena == 0):
        create = True
        missing = False

    # If afile is "a/b/foo" and bfile is "a/b/foo.orig" we assume the
    # diff is between a file and its backup. In this case, the original
    # file should be patched (see original mpatch code).
    isbackup = (abase == bbase and bfile.startswith(afile))
    fname = None
    if not missing:
        if gooda and goodb:
            if isbackup:
                fname = afile
            else:
                fname = bfile
        elif gooda:
            fname = afile

    if not fname:
        if not nullb:
            if isbackup:
                fname = afile
            else:
                fname = bfile
        elif not nulla:
            fname = afile
        else:
            raise PatchError(_("undefined source and destination files"))

    gp = patchmeta(fname)
    if create:
        gp.op = 'ADD'
    elif remove:
        gp.op = 'DELETE'
    return gp
1772 1773
def scanpatch(fp):
    """like patch.iterhunks, but yield different events

    - ('file', [header_lines + fromfile + tofile])
    - ('context', [context_lines])
    - ('hunk', [hunk_lines])
    - ('range', (-start,len, +start,len, proc))
    """
    lines_re = re.compile(br'@@ -(\d+),(\d+) \+(\d+),(\d+) @@\s*(.*)')
    lr = linereader(fp)

    def collectwhile(first, keep):
        """gather lines from lr, starting with first, while keep() holds;
        push back the first line that fails the predicate"""
        collected = [first]
        for nextline in iter(lr.readline, ''):
            if not keep(nextline):
                lr.push(nextline)
                break
            collected.append(nextline)
        return collected

    for line in iter(lr.readline, ''):
        if line.startswith('diff --git a/') or line.startswith('diff -r '):
            def notheader(l):
                parts = l.split(None, 1)
                return not parts or parts[0] not in ('---', 'diff')
            header = collectwhile(line, notheader)
            fromfile = lr.readline()
            if fromfile.startswith('---'):
                # the '---'/'+++' pair belongs to the file header
                header += [fromfile, lr.readline()]
            else:
                lr.push(fromfile)
            yield 'file', header
        elif line.startswith(' '):
            yield 'context', collectwhile(
                line, lambda l: l.startswith((' ', '\\')))
        elif line.startswith(('-', '+')):
            yield 'hunk', collectwhile(
                line, lambda l: l.startswith(('-', '+', '\\')))
        else:
            m = lines_re.match(line)
            if m:
                yield 'range', m.groups()
            else:
                yield 'other', line
1820 1821
def scangitpatch(lr, firstline):
    """
    Git patches can emit:
    - rename a to b
    - change b
    - copy a to c
    - change c

    We cannot apply this sequence as-is, the renamed 'a' could not be
    found for it would have been renamed already. And we cannot copy
    from 'b' instead because 'b' would have been changed already. So
    we scan the git patch for copy and rename commands so we can
    perform the copies ahead of time.
    """
    offset = 0
    try:
        # seekable input: remember where we are so we can rewind later
        offset = lr.fp.tell()
        src = lr.fp
    except IOError:
        # not seekable: slurp everything into an in-memory buffer
        src = stringio(lr.fp.read())
    sublr = linereader(src)
    sublr.push(firstline)
    patches = readgitpatch(sublr)
    # rewind so the caller re-reads the patch body from the start
    src.seek(offset)
    return patches
1846 1847
def iterhunks(fp):
    """Read a patch and yield the following events:
    - ("file", afile, bfile, firsthunk): select a new target file.
    - ("hunk", hunk): a new hunk is ready to be applied, follows a
    "file" event.
    - ("git", gitchanges): current diff is in git format, gitchanges
    maps filenames to gitpatch records. Unique event.
    """
    afile = ""
    bfile = ""
    state = None
    hunknum = 0
    emitfile = newfile = False
    gitpatches = None

    # our states
    BFILE = 1
    # None until the diff flavor is known: False for unified diffs,
    # True for context diffs
    context = None
    lr = linereader(fp)

    for x in iter(lr.readline, ''):
        if state == BFILE and (
            (not context and x.startswith('@'))
            or (context is not False and x.startswith('***************'))
            or x.startswith('GIT binary patch')):
            gp = None
            if (gitpatches and
                gitpatches[-1].ispatching(afile, bfile)):
                gp = gitpatches.pop()
            if x.startswith('GIT binary patch'):
                h = binhunk(lr, gp.path)
            else:
                if context is None and x.startswith('***************'):
                    context = True
                h = hunk(x, hunknum + 1, lr, context)
            hunknum += 1
            if emitfile:
                # first hunk of a file: announce the file along with it
                emitfile = False
                yield 'file', (afile, bfile, h, gp and gp.copy() or None)
            yield 'hunk', h
        elif x.startswith('diff --git a/'):
            m = gitre.match(x.rstrip(' \r\n'))
            if not m:
                continue
            if gitpatches is None:
                # scan whole input for git metadata
                gitpatches = scangitpatch(lr, x)
                yield 'git', [g.copy() for g in gitpatches
                              if g.op in ('COPY', 'RENAME')]
                gitpatches.reverse()
            afile = 'a/' + m.group(1)
            bfile = 'b/' + m.group(2)
            # emit 'file' events for intervening git patches that carry
            # no hunks of their own (pure metadata changes)
            while gitpatches and not gitpatches[-1].ispatching(afile, bfile):
                gp = gitpatches.pop()
                yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())
            if not gitpatches:
                raise PatchError(_('failed to synchronize metadata for "%s"')
                                 % afile[2:])
            gp = gitpatches[-1]
            newfile = True
        elif x.startswith('---'):
            # check for a unified diff
            l2 = lr.readline()
            if not l2.startswith('+++'):
                lr.push(l2)
                continue
            newfile = True
            context = False
            afile = parsefilename(x)
            bfile = parsefilename(l2)
        elif x.startswith('***'):
            # check for a context diff
            l2 = lr.readline()
            if not l2.startswith('---'):
                lr.push(l2)
                continue
            l3 = lr.readline()
            lr.push(l3)
            if not l3.startswith("***************"):
                lr.push(l2)
                continue
            newfile = True
            context = True
            afile = parsefilename(x)
            bfile = parsefilename(l2)

        if newfile:
            newfile = False
            emitfile = True
            state = BFILE
            hunknum = 0

    # flush any remaining metadata-only git patches
    while gitpatches:
        gp = gitpatches.pop()
        yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())
1942 1943
def applybindelta(binchunk, data):
    """Apply a git binary delta hunk to ``data`` and return the result.

    The encoding mirrors git's patch-delta.c: two varint length headers
    (source size, destination size) followed by a stream of copy/insert
    opcodes.
    """
    def deltahead(chunk):
        # Length of the varint at the start of ``chunk``: bytes with the
        # high bit set are continuation bytes.
        n = 0
        for c in pycompat.bytestr(chunk):
            n += 1
            if not (ord(c) & 0x80):
                return n
        return n
    out = ""
    # skip the two length headers; we do not validate the sizes
    binchunk = binchunk[deltahead(binchunk):]
    binchunk = binchunk[deltahead(binchunk):]
    pos = 0
    while pos < len(binchunk):
        cmd = ord(binchunk[pos:pos + 1])
        pos += 1
        if cmd & 0x80:
            # copy command: the low bits of ``cmd`` select which
            # offset/size bytes follow (little-endian, sparse encoding)
            offset = 0
            size = 0
            for shift, mask in ((0, 0x01), (8, 0x02), (16, 0x04), (24, 0x08)):
                if cmd & mask:
                    offset |= ord(binchunk[pos:pos + 1]) << shift
                    pos += 1
            for shift, mask in ((0, 0x10), (8, 0x20), (16, 0x40)):
                if cmd & mask:
                    size |= ord(binchunk[pos:pos + 1]) << shift
                    pos += 1
            if size == 0:
                # a zero size field means 64KiB, per the git format
                size = 0x10000
            out += data[offset:offset + size]
        elif cmd != 0:
            # insert command: the next ``cmd`` bytes are literal data
            out += binchunk[pos:pos + cmd]
            pos += cmd
        else:
            raise PatchError(_('unexpected delta opcode 0'))
    return out
1998 1999
def applydiff(ui, fp, backend, store, strip=1, prefix='', eolmode='strict'):
    """Read a patch from ``fp`` and try to apply it via ``backend``.

    Returns 0 for a clean patch, -1 if any rejects were found and 1 if
    there was any fuzz.

    If 'eolmode' is 'strict', the patch content and patched file are
    read in binary mode. Otherwise, line endings are ignored when
    patching then normalized according to 'eolmode'.
    """
    # ``patchfile`` is the default per-file patcher implementation
    return _applydiff(ui, fp, patchfile, backend, store, strip=strip,
                      prefix=prefix, eolmode=eolmode)
2011 2012
def _canonprefix(repo, prefix):
    """Return ``prefix`` canonicalized against the repo root, with a
    trailing '/' appended when non-empty. An empty prefix is returned
    unchanged."""
    if not prefix:
        return prefix
    canon = pathutil.canonpath(repo.root, repo.getcwd(), prefix)
    if canon != '':
        canon += '/'
    return canon
2018 2019
def _applydiff(ui, fp, patcher, backend, store, strip=1, prefix='',
               eolmode='strict'):
    """Drive ``patcher`` over every event parsed from the patch in ``fp``.

    Returns -1 when any hunk was rejected, 1 when some hunk applied with
    fuzz, and 0 on a fully clean application.
    """
    prefix = _canonprefix(backend.repo, prefix)

    def pstrip(p):
        # drop ``strip - 1`` leading components and apply the prefix
        return pathtransform(p, strip - 1, prefix)[1]

    rejects = 0
    err = 0
    current_file = None

    for state, values in iterhunks(fp):
        if state == 'hunk':
            if not current_file:
                continue
            if current_file.apply(values) > 0:
                err = 1
        elif state == 'file':
            # finish the previous file before starting a new one
            if current_file:
                rejects += current_file.close()
                current_file = None
            afile, bfile, first_hunk, gp = values
            if gp:
                gp.path = pstrip(gp.path)
                if gp.oldpath:
                    gp.oldpath = pstrip(gp.oldpath)
            else:
                gp = makepatchmeta(backend, afile, bfile, first_hunk, strip,
                                   prefix)
            if gp.op == 'RENAME':
                backend.unlink(gp.oldpath)
            if not first_hunk:
                # metadata-only change (delete, rename/copy, mode change)
                if gp.op == 'DELETE':
                    backend.unlink(gp.path)
                    continue
                data, mode = None, None
                if gp.op in ('RENAME', 'COPY'):
                    data, mode = store.getfile(gp.oldpath)[:2]
                    if data is None:
                        # the old path does not exist
                        raise PatchError(_("source file '%s' does not exist")
                                         % gp.oldpath)
                if gp.mode:
                    mode = gp.mode
                if gp.op == 'ADD':
                    # Added files without content have no hunk and
                    # must be created
                    data = ''
                if data or mode:
                    if (gp.op in ('ADD', 'RENAME', 'COPY')
                        and backend.exists(gp.path)):
                        raise PatchError(_("cannot create %s: destination "
                                           "already exists") % gp.path)
                    backend.setfile(gp.path, data, mode, gp.oldpath)
                continue
            try:
                current_file = patcher(ui, gp, backend, store,
                                       eolmode=eolmode)
            except PatchError as inst:
                ui.warn(str(inst) + '\n')
                current_file = None
                rejects += 1
                continue
        elif state == 'git':
            # stash the pre-image of copy/rename sources in the store
            for gp in values:
                path = pstrip(gp.oldpath)
                data, mode = backend.getfile(path)
                if data is not None:
                    store.setfile(path, data, mode)
                # else: a later getfile() will report the error in a more
                # appropriate place without interrupting the patching
        else:
            raise error.Abort(_('unsupported parser state: %s') % state)

    if current_file:
        rejects += current_file.close()

    return -1 if rejects else err
2103 2104
def _externalpatch(ui, repo, patcher, patchname, strip, files,
                   similarity):
    """use <patcher> to apply <patchname> to the working directory.
    returns whether patch was applied with fuzz factor."""
    fuzz = False
    args = []
    cwd = repo.root
    if cwd:
        args.append('-d %s' % procutil.shellquote(cwd))
    cmd = ('%s %s -p%d < %s'
           % (patcher, ' '.join(args), strip, procutil.shellquote(patchname)))
    ui.debug('Using external patch tool: %s\n' % cmd)
    fp = procutil.popen(cmd, 'rb')
    try:
        # scan the external tool's output for touched files and fuzz/reject
        # notices, echoing interesting lines to the user
        for line in util.iterfile(fp):
            line = line.rstrip()
            ui.note(line + '\n')
            if line.startswith('patching file '):
                pf = util.parsepatchoutput(line)
                printed_file = False
                files.add(pf)
            elif 'with fuzz' in line:
                fuzz = True
                if not printed_file:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
            elif 'saving rejects to file' in line:
                ui.warn(line + '\n')
            elif 'FAILED' in line:
                if not printed_file:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
    finally:
        if files:
            scmutil.marktouched(repo, files, similarity)
    code = fp.close()
    if code:
        raise PatchError(_("patch command failed: %s") %
                         procutil.explainexit(code))
    return fuzz
2147 2148
def patchbackend(ui, backend, patchobj, strip, prefix, files=None,
                 eolmode='strict'):
    """Apply ``patchobj`` (a path or a file object) through ``backend``.

    Raises PatchError when the patch fails to apply; otherwise returns
    whether it applied with fuzz. ``files`` collects the touched paths.
    """
    if files is None:
        files = set()
    if eolmode is None:
        eolmode = ui.config('patch', 'eol')
    if eolmode.lower() not in eolmodes:
        raise error.Abort(_('unsupported line endings type: %s') % eolmode)
    eolmode = eolmode.lower()

    store = filestore()
    try:
        # ``patchobj`` may already be an open file object
        fp = open(patchobj, 'rb')
    except TypeError:
        fp = patchobj
    try:
        ret = applydiff(ui, fp, backend, store, strip=strip, prefix=prefix,
                        eolmode=eolmode)
    finally:
        if fp != patchobj:
            fp.close()
        files.update(backend.close())
        store.close()
    if ret < 0:
        raise PatchError(_('patch failed to apply'))
    return ret > 0
2174 2175
def internalpatch(ui, repo, patchobj, strip, prefix='', files=None,
                  eolmode='strict', similarity=0):
    """use builtin patch to apply <patchobj> to the working directory.
    returns whether patch was applied with fuzz factor."""
    # the working-directory backend also handles add/remove bookkeeping
    backend = workingbackend(ui, repo, similarity)
    return patchbackend(ui, backend, patchobj, strip, prefix, files, eolmode)
2181 2182
def patchrepo(ui, repo, ctx, store, patchobj, strip, prefix, files=None,
              eolmode='strict'):
    """Apply ``patchobj`` against changectx ``ctx``, writing results into
    ``store`` instead of the working directory."""
    backend = repobackend(ui, repo, ctx, store)
    return patchbackend(ui, backend, patchobj, strip, prefix, files, eolmode)
2186 2187
def patch(ui, repo, patchname, strip=1, prefix='', files=None, eolmode='strict',
          similarity=0):
    """Apply <patchname> to the working directory.

    'eolmode' specifies how end of lines should be handled. It can be:
    - 'strict': inputs are read in binary mode, EOLs are preserved
    - 'crlf': EOLs are ignored when patching and reset to CRLF
    - 'lf': EOLs are ignored when patching and reset to LF
    - None: get it from user settings, default to 'strict'
    'eolmode' is ignored when using an external patcher program.

    Returns whether patch was applied with fuzz factor.
    """
    if files is None:
        files = set()
    # an explicit ui.patch tool takes precedence over the builtin patcher
    patcher = ui.config('ui', 'patch')
    if patcher:
        return _externalpatch(ui, repo, patcher, patchname, strip,
                              files, similarity)
    return internalpatch(ui, repo, patchname, strip, prefix, files, eolmode,
                         similarity)
2208 2209
def changedfiles(ui, repo, patchpath, strip=1, prefix=''):
    """Return the set of file paths touched by the patch at ``patchpath``,
    without applying it. Rename sources are included."""
    backend = fsbackend(ui, repo.root)
    prefix = _canonprefix(repo, prefix)

    def xform(p):
        # strip leading components and apply the canonical prefix
        return pathtransform(p, strip - 1, prefix)[1]

    with open(patchpath, 'rb') as fp:
        changed = set()
        for state, values in iterhunks(fp):
            if state == 'file':
                afile, bfile, first_hunk, gp = values
                if gp:
                    gp.path = xform(gp.path)
                    if gp.oldpath:
                        gp.oldpath = xform(gp.oldpath)
                else:
                    gp = makepatchmeta(backend, afile, bfile, first_hunk,
                                       strip, prefix)
                changed.add(gp.path)
                if gp.op == 'RENAME':
                    changed.add(gp.oldpath)
            elif state not in ('hunk', 'git'):
                raise error.Abort(_('unsupported parser state: %s') % state)
        return changed
2231 2232
class GitDiffRequired(Exception):
    """Internal signal that diff output must be regenerated in git format."""
2234 2235
# The diff option parsing (diffopts/diffallopts/difffeatureopts) moved to
# the dedicated utils/diffutil module. Keep module-level aliases so that
# existing callers of patch.diffopts and friends keep working.
diffopts = diffutil.diffopts
diffallopts = diffutil.diffallopts
difffeatureopts = diffutil.difffeatureopts
2324 2239
def diff(repo, node1=None, node2=None, match=None, changes=None,
         opts=None, losedatafn=None, prefix='', relroot='', copy=None,
         hunksfilterfn=None):
    '''yields diff of changes to files between two nodes, or node and
    working directory.

    if node1 is None, use first dirstate parent instead.
    if node2 is None, compare node1 with working directory.

    losedatafn(**kwarg) is a callable run when opts.upgrade=True and
    every time some change cannot be represented with the current
    patch format. Return False to upgrade to git patch format, True to
    accept the loss or raise an exception to abort the diff. It is
    called with the name of current file being diffed as 'fn'. If set
    to None, patches will always be upgraded to git format when
    necessary.

    prefix is a filename prefix that is prepended to all filenames on
    display (used for subrepos).

    relroot, if not empty, must be normalized with a trailing /. Any match
    patterns that fall outside it will be ignored.

    copy, if not empty, should contain mappings {dst@y: src@x} of copy
    information.

    hunksfilterfn, if not None, should be a function taking a filectx and
    hunks generator that may yield filtered hunks.
    '''
    for fctx1, fctx2, hdr, hunks in diffhunks(
        repo, node1=node1, node2=node2,
        match=match, changes=changes, opts=opts,
        losedatafn=losedatafn, prefix=prefix, relroot=relroot, copy=copy,
    ):
        if hunksfilterfn is not None:
            # If the file has been removed, fctx2 is None; but this should
            # not occur here since we catch removed files early in
            # logcmdutil.getlinerangerevs() for 'hg log -L'.
            assert fctx2 is not None, \
                'fctx2 unexpectly None in diff hunks filtering'
            hunks = hunksfilterfn(fctx2, hunks)
        # flatten every hunk's lines into one text blob
        text = ''.join(line for hrange, hlines in hunks for line in hlines)
        if hdr and (text or len(hdr) > 1):
            yield '\n'.join(hdr) + '\n'
        if text:
            yield text
2371 2286
def diffhunks(repo, node1=None, node2=None, match=None, changes=None,
              opts=None, losedatafn=None, prefix='', relroot='', copy=None):
    """Yield diff of changes to files in the form of (`header`, `hunks`) tuples
    where `header` is a list of diff headers and `hunks` is an iterable of
    (`hunkrange`, `hunklines`) tuples.

    See diff() for the meaning of parameters.
    """
    if opts is None:
        opts = mdiff.defaultopts

    if not node1 and not node2:
        node1 = repo.dirstate.p1()

    def lrugetfilectx():
        # small LRU (20 entries) of filelogs, keyed by file name, so that
        # repeated lookups of the same file reuse the revlog
        cache = {}
        order = collections.deque()
        def getfilectx(f, ctx):
            fctx = ctx.filectx(f, filelog=cache.get(f))
            if f not in cache:
                if len(cache) > 20:
                    del cache[order.popleft()]
                cache[f] = fctx.filelog()
            else:
                order.remove(f)
            order.append(f)
            return fctx
        return getfilectx
    getfilectx = lrugetfilectx()

    ctx1 = repo[node1]
    ctx2 = repo[node2]

    relfiltered = False
    if relroot != '' and match.always():
        # as a special case, create a new matcher with just the relroot
        pats = [relroot]
        match = scmutil.match(ctx2, pats, default='path')
        relfiltered = True

    if not changes:
        changes = repo.status(ctx1, ctx2, match=match)
    modified, added, removed = changes[:3]

    if not modified and not added and not removed:
        return []

    hexfunc = hex if repo.ui.debugflag else short
    revs = [hexfunc(node) for node in [ctx1.node(), ctx2.node()] if node]

    if copy is None:
        copy = {}
        if opts.git or opts.upgrade:
            copy = copies.pathcopies(ctx1, ctx2, match=match)

    if relroot is not None:
        if not relfiltered:
            # XXX this would ideally be done in the matcher, but that is
            # generally meant to 'or' patterns, not 'and' them. In this case we
            # need to 'and' all the patterns from the matcher with relroot.
            def filterrel(l):
                return [f for f in l if f.startswith(relroot)]
            modified = filterrel(modified)
            added = filterrel(added)
            removed = filterrel(removed)
            relfiltered = True
        # filter out copies where either side isn't inside the relative root
        copy = dict((dst, src) for dst, src in copy.iteritems()
                    if dst.startswith(relroot) and src.startswith(relroot))

    modifiedset = set(modified)
    addedset = set(added)
    removedset = set(removed)
    for f in modified:
        if f not in ctx1:
            # Fix up added, since merged-in additions appear as
            # modifications during merges
            modifiedset.remove(f)
            addedset.add(f)
    for f in removed:
        if f not in ctx1:
            # Merged-in additions that are then removed are reported as
            # removed. They are not in ctx1, so we don't want to show them
            # in the diff.
            removedset.remove(f)
    modified = sorted(modifiedset)
    added = sorted(addedset)
    removed = sorted(removedset)
    for dst, src in list(copy.items()):
        if src not in ctx1:
            # Files merged in during a merge and then copied/renamed are
            # reported as copies. We want to show them in the diff as
            # additions.
            del copy[dst]

    prefetchmatch = scmutil.matchfiles(
        repo, list(modifiedset | addedset | removedset))
    scmutil.prefetchfiles(repo, [ctx1.rev(), ctx2.rev()], prefetchmatch)

    def difffn(opts, losedata):
        return trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
                       copy, getfilectx, opts, losedata, prefix, relroot)
    if opts.upgrade and not opts.git:
        try:
            def losedata(fn):
                if not losedatafn or not losedatafn(fn=fn):
                    raise GitDiffRequired
            # Buffer the whole output until we are sure it can be generated
            return list(difffn(opts.copy(git=False), losedata))
        except GitDiffRequired:
            return difffn(opts.copy(git=True), None)
    else:
        return difffn(opts, None)
2488 2403
def diffsinglehunk(hunklines):
    """yield (token, label) pairs for the lines of a single hunk"""
    for line in hunklines:
        # pick the base label from the line's +/- marker
        if line.startswith('-'):
            label = 'diff.deleted'
        elif line.startswith('+'):
            label = 'diff.inserted'
        else:
            raise error.ProgrammingError('unexpected hunk line: %s' % line)
        # peel off the newline, then trailing whitespace
        nonl = line.rstrip('\n')
        body = nonl.rstrip()
        # highlight tabs separately from the surrounding text
        for token in tabsplitter.findall(body):
            if token.startswith('\t'):
                yield (token, 'diff.tab')
            else:
                yield (token, label)
        if nonl != body:
            yield (nonl[len(body):], 'diff.trailingwhitespace')
        if nonl != line:
            yield (line[len(nonl):], '')
2512 2427
def diffsinglehunkinline(hunklines):
    """yield tokens for a list of lines in a single hunk, with inline colors"""
    # collect deleted and inserted content separately
    a = ''
    b = ''
    for line in hunklines:
        if line[0] == '-':
            a += line[1:]
        elif line[0] == '+':
            b += line[1:]
        else:
            raise error.ProgrammingError('unexpected hunk line: %s' % line)
    # fast path: if either side is empty, use diffsinglehunk
    if not a or not b:
        for t in diffsinglehunk(hunklines):
            yield t
        return
    # re-split the content into words
    al = wordsplitter.findall(a)
    bl = wordsplitter.findall(b)
    # re-arrange the words to lines since the diff algorithm is line-based
    aln = [s if s == '\n' else s + '\n' for s in al]
    bln = [s if s == '\n' else s + '\n' for s in bl]
    an = ''.join(aln)
    bn = ''.join(bln)
    # run the diff algorithm, prepare atokens and btokens
    atokens = []
    btokens = []
    blocks = mdiff.allblocks(an, bn, lines1=aln, lines2=bln)
    for (a1, a2, b1, b2), btype in blocks:
        changed = btype == '!'
        for token in mdiff.splitnewlines(''.join(al[a1:a2])):
            atokens.append((changed, token))
        for token in mdiff.splitnewlines(''.join(bl[b1:b2])):
            btokens.append((changed, token))

    # yield deleted tokens, then inserted ones
    for prefix, label, tokens in [('-', 'diff.deleted', atokens),
                                  ('+', 'diff.inserted', btokens)]:
        nextisnewline = True
        for changed, token in tokens:
            if nextisnewline:
                yield (prefix, label)
                nextisnewline = False
            # special handling line end
            isendofline = token.endswith('\n')
            if isendofline:
                chomp = token[:-1] # chomp
                token = chomp.rstrip() # detect spaces at the end
                endspaces = chomp[len(token):]
            # scan tabs
            for maybetab in tabsplitter.findall(token):
                if '\t' == maybetab[0]:
                    currentlabel = 'diff.tab'
                elif changed:
                    currentlabel = label + '.changed'
                else:
                    currentlabel = label + '.unchanged'
                yield (maybetab, currentlabel)
            if isendofline:
                if endspaces:
                    yield (endspaces, 'diff.trailingwhitespace')
                yield ('\n', '')
                nextisnewline = True
2578 2493
def difflabel(func, *args, **kw):
    '''yields 2-tuples of (output, label) based on the output of func()'''
    # choose per-hunk tokenizer: inline word-diff or plain line coloring
    inlineopts = kw.get(r'opts')
    if inlineopts and inlineopts.worddiff:
        dodiffhunk = diffsinglehunkinline
    else:
        dodiffhunk = diffsinglehunk
    headprefixes = [('diff', 'diff.diffline'),
                    ('copy', 'diff.extended'),
                    ('rename', 'diff.extended'),
                    ('old', 'diff.extended'),
                    ('new', 'diff.extended'),
                    ('deleted', 'diff.extended'),
                    ('index', 'diff.extended'),
                    ('similarity', 'diff.extended'),
                    ('---', 'diff.file_a'),
                    ('+++', 'diff.file_b')]
    textprefixes = [('@', 'diff.hunk'),
                    # - and + are handled by diffsinglehunk
                    ]
    head = False

    # buffers a hunk, i.e. adjacent "-", "+" lines without other changes.
    hunkbuffer = []
    def consumehunkbuffer():
        if hunkbuffer:
            for token in dodiffhunk(hunkbuffer):
                yield token
            hunkbuffer[:] = []

    for chunk in func(*args, **kw):
        lines = chunk.split('\n')
        linecount = len(lines)
        for i, line in enumerate(lines):
            if head:
                if line.startswith('@'):
                    head = False
            else:
                if line and not line.startswith((' ', '+', '-', '@', '\\')):
                    head = True
            diffline = False
            if not head and line and line.startswith(('+', '-')):
                diffline = True

            prefixes = textprefixes
            if head:
                prefixes = headprefixes
            if diffline:
                # buffered
                bufferedline = line
                if i + 1 < linecount:
                    bufferedline += "\n"
                hunkbuffer.append(bufferedline)
            else:
                # unbuffered
                for token in consumehunkbuffer():
                    yield token
                stripline = line.rstrip()
                for prefix, label in prefixes:
                    if stripline.startswith(prefix):
                        yield (stripline, label)
                        if line != stripline:
                            yield (line[len(stripline):],
                                   'diff.trailingwhitespace')
                        break
                else:
                    yield (line, '')
                if i + 1 < linecount:
                    yield ('\n', '')
    for token in consumehunkbuffer():
        yield token
2649 2564
def diffui(*args, **kw):
    '''like diff(), but yields 2-tuples of (output, label) suitable for
    passing straight to ui.write()'''
    return difflabel(diff, *args, **kw)
2653 2568
2654 2569 def _filepairs(modified, added, removed, copy, opts):
2655 2570 '''generates tuples (f1, f2, copyop), where f1 is the name of the file
2656 2571 before and f2 is the the name after. For added files, f1 will be None,
2657 2572 and for removed files, f2 will be None. copyop may be set to None, 'copy'
2658 2573 or 'rename' (the latter two only if opts.git is set).'''
2659 2574 gone = set()
2660 2575
2661 2576 copyto = dict([(v, k) for k, v in copy.items()])
2662 2577
2663 2578 addedset, removedset = set(added), set(removed)
2664 2579
2665 2580 for f in sorted(modified + added + removed):
2666 2581 copyop = None
2667 2582 f1, f2 = f, f
2668 2583 if f in addedset:
2669 2584 f1 = None
2670 2585 if f in copy:
2671 2586 if opts.git:
2672 2587 f1 = copy[f]
2673 2588 if f1 in removedset and f1 not in gone:
2674 2589 copyop = 'rename'
2675 2590 gone.add(f1)
2676 2591 else:
2677 2592 copyop = 'copy'
2678 2593 elif f in removedset:
2679 2594 f2 = None
2680 2595 if opts.git:
2681 2596 # have we already reported a copy above?
2682 2597 if (f in copyto and copyto[f] in addedset
2683 2598 and copy[copyto[f]] == f):
2684 2599 continue
2685 2600 yield f1, f2, copyop
2686 2601
2687 2602 def trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
2688 2603 copy, getfilectx, opts, losedatafn, prefix, relroot):
2689 2604 '''given input data, generate a diff and yield it in blocks
2690 2605
2691 2606 If generating a diff would lose data like flags or binary data and
2692 2607 losedatafn is not None, it will be called.
2693 2608
2694 2609 relroot is removed and prefix is added to every path in the diff output.
2695 2610
2696 2611 If relroot is not empty, this function expects every path in modified,
2697 2612 added, removed and copy to start with it.'''
2698 2613
2699 2614 def gitindex(text):
2700 2615 if not text:
2701 2616 text = ""
2702 2617 l = len(text)
2703 2618 s = hashlib.sha1('blob %d\0' % l)
2704 2619 s.update(text)
2705 2620 return hex(s.digest())
2706 2621
2707 2622 if opts.noprefix:
2708 2623 aprefix = bprefix = ''
2709 2624 else:
2710 2625 aprefix = 'a/'
2711 2626 bprefix = 'b/'
2712 2627
2713 2628 def diffline(f, revs):
2714 2629 revinfo = ' '.join(["-r %s" % rev for rev in revs])
2715 2630 return 'diff %s %s' % (revinfo, f)
2716 2631
2717 2632 def isempty(fctx):
2718 2633 return fctx is None or fctx.size() == 0
2719 2634
2720 2635 date1 = dateutil.datestr(ctx1.date())
2721 2636 date2 = dateutil.datestr(ctx2.date())
2722 2637
2723 2638 gitmode = {'l': '120000', 'x': '100755', '': '100644'}
2724 2639
2725 2640 if relroot != '' and (repo.ui.configbool('devel', 'all-warnings')
2726 2641 or repo.ui.configbool('devel', 'check-relroot')):
2727 2642 for f in modified + added + removed + list(copy) + list(copy.values()):
2728 2643 if f is not None and not f.startswith(relroot):
2729 2644 raise AssertionError(
2730 2645 "file %s doesn't start with relroot %s" % (f, relroot))
2731 2646
2732 2647 for f1, f2, copyop in _filepairs(modified, added, removed, copy, opts):
2733 2648 content1 = None
2734 2649 content2 = None
2735 2650 fctx1 = None
2736 2651 fctx2 = None
2737 2652 flag1 = None
2738 2653 flag2 = None
2739 2654 if f1:
2740 2655 fctx1 = getfilectx(f1, ctx1)
2741 2656 if opts.git or losedatafn:
2742 2657 flag1 = ctx1.flags(f1)
2743 2658 if f2:
2744 2659 fctx2 = getfilectx(f2, ctx2)
2745 2660 if opts.git or losedatafn:
2746 2661 flag2 = ctx2.flags(f2)
2747 2662 # if binary is True, output "summary" or "base85", but not "text diff"
2748 2663 if opts.text:
2749 2664 binary = False
2750 2665 else:
2751 2666 binary = any(f.isbinary() for f in [fctx1, fctx2] if f is not None)
2752 2667
2753 2668 if losedatafn and not opts.git:
2754 2669 if (binary or
2755 2670 # copy/rename
2756 2671 f2 in copy or
2757 2672 # empty file creation
2758 2673 (not f1 and isempty(fctx2)) or
2759 2674 # empty file deletion
2760 2675 (isempty(fctx1) and not f2) or
2761 2676 # create with flags
2762 2677 (not f1 and flag2) or
2763 2678 # change flags
2764 2679 (f1 and f2 and flag1 != flag2)):
2765 2680 losedatafn(f2 or f1)
2766 2681
2767 2682 path1 = f1 or f2
2768 2683 path2 = f2 or f1
2769 2684 path1 = posixpath.join(prefix, path1[len(relroot):])
2770 2685 path2 = posixpath.join(prefix, path2[len(relroot):])
2771 2686 header = []
2772 2687 if opts.git:
2773 2688 header.append('diff --git %s%s %s%s' %
2774 2689 (aprefix, path1, bprefix, path2))
2775 2690 if not f1: # added
2776 2691 header.append('new file mode %s' % gitmode[flag2])
2777 2692 elif not f2: # removed
2778 2693 header.append('deleted file mode %s' % gitmode[flag1])
2779 2694 else: # modified/copied/renamed
2780 2695 mode1, mode2 = gitmode[flag1], gitmode[flag2]
2781 2696 if mode1 != mode2:
2782 2697 header.append('old mode %s' % mode1)
2783 2698 header.append('new mode %s' % mode2)
2784 2699 if copyop is not None:
2785 2700 if opts.showsimilarity:
2786 2701 sim = similar.score(ctx1[path1], ctx2[path2]) * 100
2787 2702 header.append('similarity index %d%%' % sim)
2788 2703 header.append('%s from %s' % (copyop, path1))
2789 2704 header.append('%s to %s' % (copyop, path2))
2790 2705 elif revs and not repo.ui.quiet:
2791 2706 header.append(diffline(path1, revs))
2792 2707
2793 2708 # fctx.is | diffopts | what to | is fctx.data()
2794 2709 # binary() | text nobinary git index | output? | outputted?
2795 2710 # ------------------------------------|----------------------------
2796 2711 # yes | no no no * | summary | no
2797 2712 # yes | no no yes * | base85 | yes
2798 2713 # yes | no yes no * | summary | no
2799 2714 # yes | no yes yes 0 | summary | no
2800 2715 # yes | no yes yes >0 | summary | semi [1]
2801 2716 # yes | yes * * * | text diff | yes
2802 2717 # no | * * * * | text diff | yes
2803 2718 # [1]: hash(fctx.data()) is outputted. so fctx.data() cannot be faked
2804 2719 if binary and (not opts.git or (opts.git and opts.nobinary and not
2805 2720 opts.index)):
2806 2721 # fast path: no binary content will be displayed, content1 and
2807 2722 # content2 are only used for equivalent test. cmp() could have a
2808 2723 # fast path.
2809 2724 if fctx1 is not None:
2810 2725 content1 = b'\0'
2811 2726 if fctx2 is not None:
2812 2727 if fctx1 is not None and not fctx1.cmp(fctx2):
2813 2728 content2 = b'\0' # not different
2814 2729 else:
2815 2730 content2 = b'\0\0'
2816 2731 else:
2817 2732 # normal path: load contents
2818 2733 if fctx1 is not None:
2819 2734 content1 = fctx1.data()
2820 2735 if fctx2 is not None:
2821 2736 content2 = fctx2.data()
2822 2737
2823 2738 if binary and opts.git and not opts.nobinary:
2824 2739 text = mdiff.b85diff(content1, content2)
2825 2740 if text:
2826 2741 header.append('index %s..%s' %
2827 2742 (gitindex(content1), gitindex(content2)))
2828 2743 hunks = (None, [text]),
2829 2744 else:
2830 2745 if opts.git and opts.index > 0:
2831 2746 flag = flag1
2832 2747 if flag is None:
2833 2748 flag = flag2
2834 2749 header.append('index %s..%s %s' %
2835 2750 (gitindex(content1)[0:opts.index],
2836 2751 gitindex(content2)[0:opts.index],
2837 2752 gitmode[flag]))
2838 2753
2839 2754 uheaders, hunks = mdiff.unidiff(content1, date1,
2840 2755 content2, date2,
2841 2756 path1, path2,
2842 2757 binary=binary, opts=opts)
2843 2758 header.extend(uheaders)
2844 2759 yield fctx1, fctx2, header, hunks
2845 2760
2846 2761 def diffstatsum(stats):
2847 2762 maxfile, maxtotal, addtotal, removetotal, binary = 0, 0, 0, 0, False
2848 2763 for f, a, r, b in stats:
2849 2764 maxfile = max(maxfile, encoding.colwidth(f))
2850 2765 maxtotal = max(maxtotal, a + r)
2851 2766 addtotal += a
2852 2767 removetotal += r
2853 2768 binary = binary or b
2854 2769
2855 2770 return maxfile, maxtotal, addtotal, removetotal, binary
2856 2771
2857 2772 def diffstatdata(lines):
2858 2773 diffre = re.compile('^diff .*-r [a-z0-9]+\s(.*)$')
2859 2774
2860 2775 results = []
2861 2776 filename, adds, removes, isbinary = None, 0, 0, False
2862 2777
2863 2778 def addresult():
2864 2779 if filename:
2865 2780 results.append((filename, adds, removes, isbinary))
2866 2781
2867 2782 # inheader is used to track if a line is in the
2868 2783 # header portion of the diff. This helps properly account
2869 2784 # for lines that start with '--' or '++'
2870 2785 inheader = False
2871 2786
2872 2787 for line in lines:
2873 2788 if line.startswith('diff'):
2874 2789 addresult()
2875 2790 # starting a new file diff
2876 2791 # set numbers to 0 and reset inheader
2877 2792 inheader = True
2878 2793 adds, removes, isbinary = 0, 0, False
2879 2794 if line.startswith('diff --git a/'):
2880 2795 filename = gitre.search(line).group(2)
2881 2796 elif line.startswith('diff -r'):
2882 2797 # format: "diff -r ... -r ... filename"
2883 2798 filename = diffre.search(line).group(1)
2884 2799 elif line.startswith('@@'):
2885 2800 inheader = False
2886 2801 elif line.startswith('+') and not inheader:
2887 2802 adds += 1
2888 2803 elif line.startswith('-') and not inheader:
2889 2804 removes += 1
2890 2805 elif (line.startswith('GIT binary patch') or
2891 2806 line.startswith('Binary file')):
2892 2807 isbinary = True
2893 2808 addresult()
2894 2809 return results
2895 2810
2896 2811 def diffstat(lines, width=80):
2897 2812 output = []
2898 2813 stats = diffstatdata(lines)
2899 2814 maxname, maxtotal, totaladds, totalremoves, hasbinary = diffstatsum(stats)
2900 2815
2901 2816 countwidth = len(str(maxtotal))
2902 2817 if hasbinary and countwidth < 3:
2903 2818 countwidth = 3
2904 2819 graphwidth = width - countwidth - maxname - 6
2905 2820 if graphwidth < 10:
2906 2821 graphwidth = 10
2907 2822
2908 2823 def scale(i):
2909 2824 if maxtotal <= graphwidth:
2910 2825 return i
2911 2826 # If diffstat runs out of room it doesn't print anything,
2912 2827 # which isn't very useful, so always print at least one + or -
2913 2828 # if there were at least some changes.
2914 2829 return max(i * graphwidth // maxtotal, int(bool(i)))
2915 2830
2916 2831 for filename, adds, removes, isbinary in stats:
2917 2832 if isbinary:
2918 2833 count = 'Bin'
2919 2834 else:
2920 2835 count = '%d' % (adds + removes)
2921 2836 pluses = '+' * scale(adds)
2922 2837 minuses = '-' * scale(removes)
2923 2838 output.append(' %s%s | %*s %s%s\n' %
2924 2839 (filename, ' ' * (maxname - encoding.colwidth(filename)),
2925 2840 countwidth, count, pluses, minuses))
2926 2841
2927 2842 if stats:
2928 2843 output.append(_(' %d files changed, %d insertions(+), '
2929 2844 '%d deletions(-)\n')
2930 2845 % (len(stats), totaladds, totalremoves))
2931 2846
2932 2847 return ''.join(output)
2933 2848
2934 2849 def diffstatui(*args, **kw):
2935 2850 '''like diffstat(), but yields 2-tuples of (output, label) for
2936 2851 ui.write()
2937 2852 '''
2938 2853
2939 2854 for line in diffstat(*args, **kw).splitlines():
2940 2855 if line and line[-1] in '+-':
2941 2856 name, graph = line.rsplit(' ', 1)
2942 2857 yield (name + ' ', '')
2943 2858 m = re.search(br'\++', graph)
2944 2859 if m:
2945 2860 yield (m.group(0), 'diffstat.inserted')
2946 2861 m = re.search(br'-+', graph)
2947 2862 if m:
2948 2863 yield (m.group(0), 'diffstat.deleted')
2949 2864 else:
2950 2865 yield (line, '')
2951 2866 yield ('\n', '')
This diff has been collapsed as it changes many lines, (2860 lines changed) Show them Hide them
@@ -1,2951 +1,107
1 # patch.py - patch file parsing routines
1 # diffutil.py - utility functions related to diff and patch
2 2 #
3 3 # Copyright 2006 Brendan Cully <brendan@kublai.com>
4 4 # Copyright 2007 Chris Mason <chris.mason@oracle.com>
5 # Copyright 2018 Octobus <octobus@octobus.net>
5 6 #
6 7 # This software may be used and distributed according to the terms of the
7 8 # GNU General Public License version 2 or any later version.
8 9
9 from __future__ import absolute_import, print_function
10
11 import collections
12 import contextlib
13 import copy
14 import email
15 import errno
16 import hashlib
17 import os
18 import posixpath
19 import re
20 import shutil
21 import zlib
22
23 from .i18n import _
24 from .node import (
25 hex,
26 short,
27 )
28 from . import (
29 copies,
30 diffhelper,
31 encoding,
32 error,
33 mail,
34 mdiff,
35 pathutil,
36 pycompat,
37 scmutil,
38 similar,
39 util,
40 vfs as vfsmod,
41 )
42 from .utils import (
43 dateutil,
44 procutil,
45 stringutil,
46 )
47
48 stringio = util.stringio
49
50 gitre = re.compile(br'diff --git a/(.*) b/(.*)')
51 tabsplitter = re.compile(br'(\t+|[^\t]+)')
52 wordsplitter = re.compile(br'(\t+| +|[a-zA-Z0-9_\x80-\xff]+|'
53 b'[^ \ta-zA-Z0-9_\x80-\xff])')
54
55 PatchError = error.PatchError
56
57 # public functions
58
59 def split(stream):
60 '''return an iterator of individual patches from a stream'''
61 def isheader(line, inheader):
62 if inheader and line.startswith((' ', '\t')):
63 # continuation
64 return True
65 if line.startswith((' ', '-', '+')):
66 # diff line - don't check for header pattern in there
67 return False
68 l = line.split(': ', 1)
69 return len(l) == 2 and ' ' not in l[0]
70
71 def chunk(lines):
72 return stringio(''.join(lines))
73
74 def hgsplit(stream, cur):
75 inheader = True
76
77 for line in stream:
78 if not line.strip():
79 inheader = False
80 if not inheader and line.startswith('# HG changeset patch'):
81 yield chunk(cur)
82 cur = []
83 inheader = True
84
85 cur.append(line)
86
87 if cur:
88 yield chunk(cur)
89
90 def mboxsplit(stream, cur):
91 for line in stream:
92 if line.startswith('From '):
93 for c in split(chunk(cur[1:])):
94 yield c
95 cur = []
96
97 cur.append(line)
98
99 if cur:
100 for c in split(chunk(cur[1:])):
101 yield c
102
103 def mimesplit(stream, cur):
104 def msgfp(m):
105 fp = stringio()
106 g = email.Generator.Generator(fp, mangle_from_=False)
107 g.flatten(m)
108 fp.seek(0)
109 return fp
110
111 for line in stream:
112 cur.append(line)
113 c = chunk(cur)
114
115 m = mail.parse(c)
116 if not m.is_multipart():
117 yield msgfp(m)
118 else:
119 ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
120 for part in m.walk():
121 ct = part.get_content_type()
122 if ct not in ok_types:
123 continue
124 yield msgfp(part)
125
126 def headersplit(stream, cur):
127 inheader = False
128
129 for line in stream:
130 if not inheader and isheader(line, inheader):
131 yield chunk(cur)
132 cur = []
133 inheader = True
134 if inheader and not isheader(line, inheader):
135 inheader = False
136
137 cur.append(line)
138
139 if cur:
140 yield chunk(cur)
141
142 def remainder(cur):
143 yield chunk(cur)
144
145 class fiter(object):
146 def __init__(self, fp):
147 self.fp = fp
148
149 def __iter__(self):
150 return self
151
152 def next(self):
153 l = self.fp.readline()
154 if not l:
155 raise StopIteration
156 return l
157
158 __next__ = next
159
160 inheader = False
161 cur = []
162
163 mimeheaders = ['content-type']
164
165 if not util.safehasattr(stream, 'next'):
166 # http responses, for example, have readline but not next
167 stream = fiter(stream)
168
169 for line in stream:
170 cur.append(line)
171 if line.startswith('# HG changeset patch'):
172 return hgsplit(stream, cur)
173 elif line.startswith('From '):
174 return mboxsplit(stream, cur)
175 elif isheader(line, inheader):
176 inheader = True
177 if line.split(':', 1)[0].lower() in mimeheaders:
178 # let email parser handle this
179 return mimesplit(stream, cur)
180 elif line.startswith('--- ') and inheader:
181 # No evil headers seen by diff start, split by hand
182 return headersplit(stream, cur)
183 # Not enough info, keep reading
184
185 # if we are here, we have a very plain patch
186 return remainder(cur)
187
188 ## Some facility for extensible patch parsing:
189 # list of pairs ("header to match", "data key")
190 patchheadermap = [('Date', 'date'),
191 ('Branch', 'branch'),
192 ('Node ID', 'nodeid'),
193 ]
194
195 @contextlib.contextmanager
196 def extract(ui, fileobj):
197 '''extract patch from data read from fileobj.
198
199 patch can be a normal patch or contained in an email message.
200
201 return a dictionary. Standard keys are:
202 - filename,
203 - message,
204 - user,
205 - date,
206 - branch,
207 - node,
208 - p1,
209 - p2.
210 Any item can be missing from the dictionary. If filename is missing,
211 fileobj did not contain a patch. Caller must unlink filename when done.'''
212
213 fd, tmpname = pycompat.mkstemp(prefix='hg-patch-')
214 tmpfp = os.fdopen(fd, r'wb')
215 try:
216 yield _extract(ui, fileobj, tmpname, tmpfp)
217 finally:
218 tmpfp.close()
219 os.unlink(tmpname)
220
221 def _extract(ui, fileobj, tmpname, tmpfp):
222
223 # attempt to detect the start of a patch
224 # (this heuristic is borrowed from quilt)
225 diffre = re.compile(br'^(?:Index:[ \t]|diff[ \t]-|RCS file: |'
226 br'retrieving revision [0-9]+(\.[0-9]+)*$|'
227 br'---[ \t].*?^\+\+\+[ \t]|'
228 br'\*\*\*[ \t].*?^---[ \t])',
229 re.MULTILINE | re.DOTALL)
230
231 data = {}
232
233 msg = mail.parse(fileobj)
234
235 subject = msg[r'Subject'] and mail.headdecode(msg[r'Subject'])
236 data['user'] = msg[r'From'] and mail.headdecode(msg[r'From'])
237 if not subject and not data['user']:
238 # Not an email, restore parsed headers if any
239 subject = '\n'.join(': '.join(map(encoding.strtolocal, h))
240 for h in msg.items()) + '\n'
241
242 # should try to parse msg['Date']
243 parents = []
244
245 if subject:
246 if subject.startswith('[PATCH'):
247 pend = subject.find(']')
248 if pend >= 0:
249 subject = subject[pend + 1:].lstrip()
250 subject = re.sub(br'\n[ \t]+', ' ', subject)
251 ui.debug('Subject: %s\n' % subject)
252 if data['user']:
253 ui.debug('From: %s\n' % data['user'])
254 diffs_seen = 0
255 ok_types = ('text/plain', 'text/x-diff', 'text/x-patch')
256 message = ''
257 for part in msg.walk():
258 content_type = pycompat.bytestr(part.get_content_type())
259 ui.debug('Content-Type: %s\n' % content_type)
260 if content_type not in ok_types:
261 continue
262 payload = part.get_payload(decode=True)
263 m = diffre.search(payload)
264 if m:
265 hgpatch = False
266 hgpatchheader = False
267 ignoretext = False
268
269 ui.debug('found patch at byte %d\n' % m.start(0))
270 diffs_seen += 1
271 cfp = stringio()
272 for line in payload[:m.start(0)].splitlines():
273 if line.startswith('# HG changeset patch') and not hgpatch:
274 ui.debug('patch generated by hg export\n')
275 hgpatch = True
276 hgpatchheader = True
277 # drop earlier commit message content
278 cfp.seek(0)
279 cfp.truncate()
280 subject = None
281 elif hgpatchheader:
282 if line.startswith('# User '):
283 data['user'] = line[7:]
284 ui.debug('From: %s\n' % data['user'])
285 elif line.startswith("# Parent "):
286 parents.append(line[9:].lstrip())
287 elif line.startswith("# "):
288 for header, key in patchheadermap:
289 prefix = '# %s ' % header
290 if line.startswith(prefix):
291 data[key] = line[len(prefix):]
292 else:
293 hgpatchheader = False
294 elif line == '---':
295 ignoretext = True
296 if not hgpatchheader and not ignoretext:
297 cfp.write(line)
298 cfp.write('\n')
299 message = cfp.getvalue()
300 if tmpfp:
301 tmpfp.write(payload)
302 if not payload.endswith('\n'):
303 tmpfp.write('\n')
304 elif not diffs_seen and message and content_type == 'text/plain':
305 message += '\n' + payload
306
307 if subject and not message.startswith(subject):
308 message = '%s\n%s' % (subject, message)
309 data['message'] = message
310 tmpfp.close()
311 if parents:
312 data['p1'] = parents.pop(0)
313 if parents:
314 data['p2'] = parents.pop(0)
315
316 if diffs_seen:
317 data['filename'] = tmpname
318
319 return data
320
321 class patchmeta(object):
322 """Patched file metadata
323
324 'op' is the performed operation within ADD, DELETE, RENAME, MODIFY
325 or COPY. 'path' is patched file path. 'oldpath' is set to the
326 origin file when 'op' is either COPY or RENAME, None otherwise. If
327 file mode is changed, 'mode' is a tuple (islink, isexec) where
328 'islink' is True if the file is a symlink and 'isexec' is True if
329 the file is executable. Otherwise, 'mode' is None.
330 """
331 def __init__(self, path):
332 self.path = path
333 self.oldpath = None
334 self.mode = None
335 self.op = 'MODIFY'
336 self.binary = False
337
338 def setmode(self, mode):
339 islink = mode & 0o20000
340 isexec = mode & 0o100
341 self.mode = (islink, isexec)
342
343 def copy(self):
344 other = patchmeta(self.path)
345 other.oldpath = self.oldpath
346 other.mode = self.mode
347 other.op = self.op
348 other.binary = self.binary
349 return other
350
351 def _ispatchinga(self, afile):
352 if afile == '/dev/null':
353 return self.op == 'ADD'
354 return afile == 'a/' + (self.oldpath or self.path)
355
356 def _ispatchingb(self, bfile):
357 if bfile == '/dev/null':
358 return self.op == 'DELETE'
359 return bfile == 'b/' + self.path
360
361 def ispatching(self, afile, bfile):
362 return self._ispatchinga(afile) and self._ispatchingb(bfile)
363
364 def __repr__(self):
365 return "<patchmeta %s %r>" % (self.op, self.path)
366
367 def readgitpatch(lr):
368 """extract git-style metadata about patches from <patchname>"""
369
370 # Filter patch for git information
371 gp = None
372 gitpatches = []
373 for line in lr:
374 line = line.rstrip(' \r\n')
375 if line.startswith('diff --git a/'):
376 m = gitre.match(line)
377 if m:
378 if gp:
379 gitpatches.append(gp)
380 dst = m.group(2)
381 gp = patchmeta(dst)
382 elif gp:
383 if line.startswith('--- '):
384 gitpatches.append(gp)
385 gp = None
386 continue
387 if line.startswith('rename from '):
388 gp.op = 'RENAME'
389 gp.oldpath = line[12:]
390 elif line.startswith('rename to '):
391 gp.path = line[10:]
392 elif line.startswith('copy from '):
393 gp.op = 'COPY'
394 gp.oldpath = line[10:]
395 elif line.startswith('copy to '):
396 gp.path = line[8:]
397 elif line.startswith('deleted file'):
398 gp.op = 'DELETE'
399 elif line.startswith('new file mode '):
400 gp.op = 'ADD'
401 gp.setmode(int(line[-6:], 8))
402 elif line.startswith('new mode '):
403 gp.setmode(int(line[-6:], 8))
404 elif line.startswith('GIT binary patch'):
405 gp.binary = True
406 if gp:
407 gitpatches.append(gp)
408
409 return gitpatches
410
411 class linereader(object):
412 # simple class to allow pushing lines back into the input stream
413 def __init__(self, fp):
414 self.fp = fp
415 self.buf = []
416
417 def push(self, line):
418 if line is not None:
419 self.buf.append(line)
420
421 def readline(self):
422 if self.buf:
423 l = self.buf[0]
424 del self.buf[0]
425 return l
426 return self.fp.readline()
427
428 def __iter__(self):
429 return iter(self.readline, '')
430
431 class abstractbackend(object):
432 def __init__(self, ui):
433 self.ui = ui
434
435 def getfile(self, fname):
436 """Return target file data and flags as a (data, (islink,
437 isexec)) tuple. Data is None if file is missing/deleted.
438 """
439 raise NotImplementedError
440
441 def setfile(self, fname, data, mode, copysource):
442 """Write data to target file fname and set its mode. mode is a
443 (islink, isexec) tuple. If data is None, the file content should
444 be left unchanged. If the file is modified after being copied,
445 copysource is set to the original file name.
446 """
447 raise NotImplementedError
448
449 def unlink(self, fname):
450 """Unlink target file."""
451 raise NotImplementedError
452
453 def writerej(self, fname, failed, total, lines):
454 """Write rejected lines for fname. total is the number of hunks
455 which failed to apply and total the total number of hunks for this
456 files.
457 """
458
459 def exists(self, fname):
460 raise NotImplementedError
461
462 def close(self):
463 raise NotImplementedError
464
465 class fsbackend(abstractbackend):
466 def __init__(self, ui, basedir):
467 super(fsbackend, self).__init__(ui)
468 self.opener = vfsmod.vfs(basedir)
469
470 def getfile(self, fname):
471 if self.opener.islink(fname):
472 return (self.opener.readlink(fname), (True, False))
473
474 isexec = False
475 try:
476 isexec = self.opener.lstat(fname).st_mode & 0o100 != 0
477 except OSError as e:
478 if e.errno != errno.ENOENT:
479 raise
480 try:
481 return (self.opener.read(fname), (False, isexec))
482 except IOError as e:
483 if e.errno != errno.ENOENT:
484 raise
485 return None, None
486
487 def setfile(self, fname, data, mode, copysource):
488 islink, isexec = mode
489 if data is None:
490 self.opener.setflags(fname, islink, isexec)
491 return
492 if islink:
493 self.opener.symlink(data, fname)
494 else:
495 self.opener.write(fname, data)
496 if isexec:
497 self.opener.setflags(fname, False, True)
498
499 def unlink(self, fname):
500 rmdir = self.ui.configbool('experimental', 'removeemptydirs')
501 self.opener.unlinkpath(fname, ignoremissing=True, rmdir=rmdir)
502
503 def writerej(self, fname, failed, total, lines):
504 fname = fname + ".rej"
505 self.ui.warn(
506 _("%d out of %d hunks FAILED -- saving rejects to file %s\n") %
507 (failed, total, fname))
508 fp = self.opener(fname, 'w')
509 fp.writelines(lines)
510 fp.close()
511
512 def exists(self, fname):
513 return self.opener.lexists(fname)
514
515 class workingbackend(fsbackend):
516 def __init__(self, ui, repo, similarity):
517 super(workingbackend, self).__init__(ui, repo.root)
518 self.repo = repo
519 self.similarity = similarity
520 self.removed = set()
521 self.changed = set()
522 self.copied = []
523
524 def _checkknown(self, fname):
525 if self.repo.dirstate[fname] == '?' and self.exists(fname):
526 raise PatchError(_('cannot patch %s: file is not tracked') % fname)
527
528 def setfile(self, fname, data, mode, copysource):
529 self._checkknown(fname)
530 super(workingbackend, self).setfile(fname, data, mode, copysource)
531 if copysource is not None:
532 self.copied.append((copysource, fname))
533 self.changed.add(fname)
534
535 def unlink(self, fname):
536 self._checkknown(fname)
537 super(workingbackend, self).unlink(fname)
538 self.removed.add(fname)
539 self.changed.add(fname)
10 from __future__ import absolute_import
540 11
541 def close(self):
542 wctx = self.repo[None]
543 changed = set(self.changed)
544 for src, dst in self.copied:
545 scmutil.dirstatecopy(self.ui, self.repo, wctx, src, dst)
546 if self.removed:
547 wctx.forget(sorted(self.removed))
548 for f in self.removed:
549 if f not in self.repo.dirstate:
550 # File was deleted and no longer belongs to the
551 # dirstate, it was probably marked added then
552 # deleted, and should not be considered by
553 # marktouched().
554 changed.discard(f)
555 if changed:
556 scmutil.marktouched(self.repo, changed, self.similarity)
557 return sorted(self.changed)
558
559 class filestore(object):
560 def __init__(self, maxsize=None):
561 self.opener = None
562 self.files = {}
563 self.created = 0
564 self.maxsize = maxsize
565 if self.maxsize is None:
566 self.maxsize = 4*(2**20)
567 self.size = 0
568 self.data = {}
569
570 def setfile(self, fname, data, mode, copied=None):
571 if self.maxsize < 0 or (len(data) + self.size) <= self.maxsize:
572 self.data[fname] = (data, mode, copied)
573 self.size += len(data)
574 else:
575 if self.opener is None:
576 root = pycompat.mkdtemp(prefix='hg-patch-')
577 self.opener = vfsmod.vfs(root)
578 # Avoid filename issues with these simple names
579 fn = '%d' % self.created
580 self.opener.write(fn, data)
581 self.created += 1
582 self.files[fname] = (fn, mode, copied)
583
584 def getfile(self, fname):
585 if fname in self.data:
586 return self.data[fname]
587 if not self.opener or fname not in self.files:
588 return None, None, None
589 fn, mode, copied = self.files[fname]
590 return self.opener.read(fn), mode, copied
591
592 def close(self):
593 if self.opener:
594 shutil.rmtree(self.opener.base)
595
596 class repobackend(abstractbackend):
597 def __init__(self, ui, repo, ctx, store):
598 super(repobackend, self).__init__(ui)
599 self.repo = repo
600 self.ctx = ctx
601 self.store = store
602 self.changed = set()
603 self.removed = set()
604 self.copied = {}
605
606 def _checkknown(self, fname):
607 if fname not in self.ctx:
608 raise PatchError(_('cannot patch %s: file is not tracked') % fname)
609
610 def getfile(self, fname):
611 try:
612 fctx = self.ctx[fname]
613 except error.LookupError:
614 return None, None
615 flags = fctx.flags()
616 return fctx.data(), ('l' in flags, 'x' in flags)
617
618 def setfile(self, fname, data, mode, copysource):
619 if copysource:
620 self._checkknown(copysource)
621 if data is None:
622 data = self.ctx[fname].data()
623 self.store.setfile(fname, data, mode, copysource)
624 self.changed.add(fname)
625 if copysource:
626 self.copied[fname] = copysource
627
628 def unlink(self, fname):
629 self._checkknown(fname)
630 self.removed.add(fname)
631
632 def exists(self, fname):
633 return fname in self.ctx
634
635 def close(self):
636 return self.changed | self.removed
637
638 # @@ -start,len +start,len @@ or @@ -start +start @@ if len is 1
639 unidesc = re.compile('@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@')
640 contextdesc = re.compile('(?:---|\*\*\*) (\d+)(?:,(\d+))? (?:---|\*\*\*)')
641 eolmodes = ['strict', 'crlf', 'lf', 'auto']
642
643 class patchfile(object):
644 def __init__(self, ui, gp, backend, store, eolmode='strict'):
645 self.fname = gp.path
646 self.eolmode = eolmode
647 self.eol = None
648 self.backend = backend
649 self.ui = ui
650 self.lines = []
651 self.exists = False
652 self.missing = True
653 self.mode = gp.mode
654 self.copysource = gp.oldpath
655 self.create = gp.op in ('ADD', 'COPY', 'RENAME')
656 self.remove = gp.op == 'DELETE'
657 if self.copysource is None:
658 data, mode = backend.getfile(self.fname)
659 else:
660 data, mode = store.getfile(self.copysource)[:2]
661 if data is not None:
662 self.exists = self.copysource is None or backend.exists(self.fname)
663 self.missing = False
664 if data:
665 self.lines = mdiff.splitnewlines(data)
666 if self.mode is None:
667 self.mode = mode
668 if self.lines:
669 # Normalize line endings
670 if self.lines[0].endswith('\r\n'):
671 self.eol = '\r\n'
672 elif self.lines[0].endswith('\n'):
673 self.eol = '\n'
674 if eolmode != 'strict':
675 nlines = []
676 for l in self.lines:
677 if l.endswith('\r\n'):
678 l = l[:-2] + '\n'
679 nlines.append(l)
680 self.lines = nlines
681 else:
682 if self.create:
683 self.missing = False
684 if self.mode is None:
685 self.mode = (False, False)
686 if self.missing:
687 self.ui.warn(_("unable to find '%s' for patching\n") % self.fname)
688 self.ui.warn(_("(use '--prefix' to apply patch relative to the "
689 "current directory)\n"))
690
691 self.hash = {}
692 self.dirty = 0
693 self.offset = 0
694 self.skew = 0
695 self.rej = []
696 self.fileprinted = False
697 self.printfile(False)
698 self.hunks = 0
699
700 def writelines(self, fname, lines, mode):
701 if self.eolmode == 'auto':
702 eol = self.eol
703 elif self.eolmode == 'crlf':
704 eol = '\r\n'
705 else:
706 eol = '\n'
707
708 if self.eolmode != 'strict' and eol and eol != '\n':
709 rawlines = []
710 for l in lines:
711 if l and l.endswith('\n'):
712 l = l[:-1] + eol
713 rawlines.append(l)
714 lines = rawlines
715
716 self.backend.setfile(fname, ''.join(lines), mode, self.copysource)
717
718 def printfile(self, warn):
719 if self.fileprinted:
720 return
721 if warn or self.ui.verbose:
722 self.fileprinted = True
723 s = _("patching file %s\n") % self.fname
724 if warn:
725 self.ui.warn(s)
726 else:
727 self.ui.note(s)
728
729
730 def findlines(self, l, linenum):
731 # looks through the hash and finds candidate lines. The
732 # result is a list of line numbers sorted based on distance
733 # from linenum
734
735 cand = self.hash.get(l, [])
736 if len(cand) > 1:
737 # resort our list of potentials forward then back.
738 cand.sort(key=lambda x: abs(x - linenum))
739 return cand
740
741 def write_rej(self):
742 # our rejects are a little different from patch(1). This always
743 # creates rejects in the same form as the original patch. A file
744 # header is inserted so that you can run the reject through patch again
745 # without having to type the filename.
746 if not self.rej:
747 return
748 base = os.path.basename(self.fname)
749 lines = ["--- %s\n+++ %s\n" % (base, base)]
750 for x in self.rej:
751 for l in x.hunk:
752 lines.append(l)
753 if l[-1:] != '\n':
754 lines.append("\n\ No newline at end of file\n")
755 self.backend.writerej(self.fname, len(self.rej), self.hunks, lines)
756
757 def apply(self, h):
758 if not h.complete():
759 raise PatchError(_("bad hunk #%d %s (%d %d %d %d)") %
760 (h.number, h.desc, len(h.a), h.lena, len(h.b),
761 h.lenb))
762
763 self.hunks += 1
764
765 if self.missing:
766 self.rej.append(h)
767 return -1
768
769 if self.exists and self.create:
770 if self.copysource:
771 self.ui.warn(_("cannot create %s: destination already "
772 "exists\n") % self.fname)
773 else:
774 self.ui.warn(_("file %s already exists\n") % self.fname)
775 self.rej.append(h)
776 return -1
777
778 if isinstance(h, binhunk):
779 if self.remove:
780 self.backend.unlink(self.fname)
781 else:
782 l = h.new(self.lines)
783 self.lines[:] = l
784 self.offset += len(l)
785 self.dirty = True
786 return 0
787
788 horig = h
789 if (self.eolmode in ('crlf', 'lf')
790 or self.eolmode == 'auto' and self.eol):
791 # If new eols are going to be normalized, then normalize
792 # hunk data before patching. Otherwise, preserve input
793 # line-endings.
794 h = h.getnormalized()
795
796 # fast case first, no offsets, no fuzz
797 old, oldstart, new, newstart = h.fuzzit(0, False)
798 oldstart += self.offset
799 orig_start = oldstart
800 # if there's skew we want to emit the "(offset %d lines)" even
801 # when the hunk cleanly applies at start + skew, so skip the
802 # fast case code
803 if self.skew == 0 and diffhelper.testhunk(old, self.lines, oldstart):
804 if self.remove:
805 self.backend.unlink(self.fname)
806 else:
807 self.lines[oldstart:oldstart + len(old)] = new
808 self.offset += len(new) - len(old)
809 self.dirty = True
810 return 0
811
812 # ok, we couldn't match the hunk. Lets look for offsets and fuzz it
813 self.hash = {}
814 for x, s in enumerate(self.lines):
815 self.hash.setdefault(s, []).append(x)
816
817 for fuzzlen in xrange(self.ui.configint("patch", "fuzz") + 1):
818 for toponly in [True, False]:
819 old, oldstart, new, newstart = h.fuzzit(fuzzlen, toponly)
820 oldstart = oldstart + self.offset + self.skew
821 oldstart = min(oldstart, len(self.lines))
822 if old:
823 cand = self.findlines(old[0][1:], oldstart)
824 else:
825 # Only adding lines with no or fuzzed context, just
826 # take the skew in account
827 cand = [oldstart]
828
829 for l in cand:
830 if not old or diffhelper.testhunk(old, self.lines, l):
831 self.lines[l : l + len(old)] = new
832 self.offset += len(new) - len(old)
833 self.skew = l - orig_start
834 self.dirty = True
835 offset = l - orig_start - fuzzlen
836 if fuzzlen:
837 msg = _("Hunk #%d succeeded at %d "
838 "with fuzz %d "
839 "(offset %d lines).\n")
840 self.printfile(True)
841 self.ui.warn(msg %
842 (h.number, l + 1, fuzzlen, offset))
843 else:
844 msg = _("Hunk #%d succeeded at %d "
845 "(offset %d lines).\n")
846 self.ui.note(msg % (h.number, l + 1, offset))
847 return fuzzlen
848 self.printfile(True)
849 self.ui.warn(_("Hunk #%d FAILED at %d\n") % (h.number, orig_start))
850 self.rej.append(horig)
851 return -1
852
853 def close(self):
854 if self.dirty:
855 self.writelines(self.fname, self.lines, self.mode)
856 self.write_rej()
857 return len(self.rej)
858
class header(object):
    """The file-header portion of a patch (the lines before the hunks)."""
    diffgit_re = re.compile('diff --git a/(.*) b/(.*)$')
    diff_re = re.compile('diff -r .* (.*)$')
    allhunks_re = re.compile('(?:index|deleted file) ')
    pretty_re = re.compile('(?:new file|deleted file) ')
    special_re = re.compile('(?:index|deleted|copy|rename) ')
    newfile_re = re.compile('(?:new file)')

    def __init__(self, header):
        self.header = header
        self.hunks = []

    def binary(self):
        # a git 'index' line marks binary (all-or-nothing) content
        for line in self.header:
            if line.startswith('index '):
                return True
        return False

    def pretty(self, fp):
        """Write a human-oriented rendering of the header to fp."""
        for line in self.header:
            if line.startswith('index '):
                fp.write(_('this modifies a binary file (all or nothing)\n'))
                break
            if self.pretty_re.match(line):
                fp.write(line)
                if self.binary():
                    fp.write(_('this is a binary file\n'))
                    break
            if line.startswith('---'):
                fp.write(_('%d hunks, %d lines changed\n') %
                         (len(self.hunks),
                          sum([max(h.added, h.removed) for h in self.hunks])))
                break
            fp.write(line)

    def write(self, fp):
        fp.write(''.join(self.header))

    def allhunks(self):
        # when True, the hunks cannot be cherry-picked individually
        for line in self.header:
            if self.allhunks_re.match(line):
                return True
        return False

    def files(self):
        """Return the path(s) this header refers to."""
        match = self.diffgit_re.match(self.header[0])
        if not match:
            return self.diff_re.match(self.header[0]).groups()
        fromfile, tofile = match.groups()
        if fromfile == tofile:
            return [fromfile]
        return [fromfile, tofile]

    def filename(self):
        return self.files()[-1]

    def __repr__(self):
        return '<header %s>' % (' '.join(repr(f) for f in self.files()))

    def isnewfile(self):
        for line in self.header:
            if self.newfile_re.match(line):
                return True
        return False

    def special(self):
        # Special files are shown only at the header level and not at the
        # hunk level; e.g. a deleted file is special, because the user can
        # only take or leave the deletion as a whole.  A newly added file
        # is special only while empty: once it has content, that content
        # should remain editable hunk by hunk.
        if self.isnewfile() and len(self.header) == 2:
            return True
        return any(self.special_re.match(line) for line in self.header)
930
class recordhunk(object):
    """patch hunk

    XXX shouldn't we merge this with the other hunk class?
    """

    def __init__(self, header, fromline, toline, proc, before, hunk, after,
                 maxcontext=None):
        def trimcontext(lines, reverse=False):
            # limit context to maxcontext lines, reporting how many were
            # dropped (only meaningful for the leading context)
            if maxcontext is None:
                return 0, lines
            surplus = len(lines) - maxcontext
            if surplus <= 0:
                return 0, lines
            if reverse:
                return surplus, lines[surplus:]
            return surplus, lines[:maxcontext]

        self.header = header
        trimedbefore, self.before = trimcontext(before, True)
        # dropped leading context shifts the hunk start forward
        self.fromline = fromline + trimedbefore
        self.toline = toline + trimedbefore
        _trimedafter, self.after = trimcontext(after, False)
        self.proc = proc
        self.hunk = hunk
        self.added, self.removed = self.countchanges(self.hunk)

    def __eq__(self, v):
        if not isinstance(v, recordhunk):
            return False
        return (v.hunk == self.hunk
                and v.proc == self.proc
                and self.fromline == v.fromline
                and self.header.files() == v.header.files())

    def __hash__(self):
        return hash((tuple(self.hunk), tuple(self.header.files()),
                     self.fromline, self.proc))

    def countchanges(self, hunk):
        """hunk -> (n+,n-)"""
        add = sum(1 for line in hunk if line.startswith('+'))
        rem = sum(1 for line in hunk if line.startswith('-'))
        return add, rem

    def reversehunk(self):
        """return another recordhunk which is the reverse of the hunk

        If this hunk is diff(A, B), the returned hunk is diff(B, A). To do
        that, swap fromline/toline and +/- signs while keep other things
        unchanged.
        """
        flip = {'+': '-', '-': '+', '\\': '\\'}
        flipped = [flip[line[0:1]] + line[1:] for line in self.hunk]
        return recordhunk(self.header, self.toline, self.fromline, self.proc,
                          self.before, flipped, self.after)

    def write(self, fp):
        context = len(self.before) + len(self.after)
        # the no-eol marker does not count toward the line ranges
        if self.after and self.after[-1] == '\\ No newline at end of file\n':
            context -= 1
        fp.write('@@ -%d,%d +%d,%d @@%s\n' %
                 (self.fromline, context + self.removed,
                  self.toline, context + self.added,
                  self.proc and (' ' + self.proc)))
        fp.write(''.join(self.before + self.hunk + self.after))

    pretty = write

    def filename(self):
        return self.header.filename()

    def __repr__(self):
        return '<hunk %r@%d>' % (self.filename(), self.fromline)
1009
def getmessages():
    """Return the prompt texts used by the interactive hunk filter.

    Keyed first by situation ('multiple' when several changes are being
    reviewed, 'single' when there is only one, 'help' for the
    promptchoice response list) and then by operation ('apply',
    'discard' or 'record').
    """
    return {
        'multiple': {
            'apply': _("apply change %d/%d to '%s'?"),
            'discard': _("discard change %d/%d to '%s'?"),
            'record': _("record change %d/%d to '%s'?"),
        },
        'single': {
            'apply': _("apply this change to '%s'?"),
            'discard': _("discard this change to '%s'?"),
            'record': _("record this change to '%s'?"),
        },
        'help': {
            'apply': _('[Ynesfdaq?]'
                       '$$ &Yes, apply this change'
                       '$$ &No, skip this change'
                       '$$ &Edit this change manually'
                       '$$ &Skip remaining changes to this file'
                       '$$ Apply remaining changes to this &file'
                       '$$ &Done, skip remaining changes and files'
                       '$$ Apply &all changes to all remaining files'
                       '$$ &Quit, applying no changes'
                       '$$ &? (display help)'),
            'discard': _('[Ynesfdaq?]'
                         '$$ &Yes, discard this change'
                         '$$ &No, skip this change'
                         '$$ &Edit this change manually'
                         '$$ &Skip remaining changes to this file'
                         '$$ Discard remaining changes to this &file'
                         '$$ &Done, skip remaining changes and files'
                         '$$ Discard &all changes to all remaining files'
                         '$$ &Quit, discarding no changes'
                         '$$ &? (display help)'),
            'record': _('[Ynesfdaq?]'
                        '$$ &Yes, record this change'
                        '$$ &No, skip this change'
                        '$$ &Edit this change manually'
                        '$$ &Skip remaining changes to this file'
                        '$$ Record remaining changes to this &file'
                        '$$ &Done, skip remaining changes and files'
                        '$$ Record &all changes to all remaining files'
                        '$$ &Quit, recording no changes'
                        '$$ &? (display help)'),
        }
    }
1055
def filterpatch(ui, headers, operation=None):
    """Interactively filter patch chunks into applied-only chunks

    Walks each header and its hunks, prompting the user for each one.
    Returns a two-element tuple: the list of kept headers/hunks
    (headers whose every hunk was refused are dropped, unless special)
    and an (empty) dict of extra state.
    """
    messages = getmessages()

    if operation is None:
        operation = 'record'

    def prompt(skipfile, skipall, query, chunk):
        """prompt query, and process base inputs

        - y/n for the rest of file
        - y/n for the rest
        - ? (help)
        - q (quit)

        Return True/False and possibly updated skipfile and skipall.
        """
        newpatches = None
        # a previous 'file'/'all' answer short-circuits further prompting
        if skipall is not None:
            return skipall, skipfile, skipall, newpatches
        if skipfile is not None:
            return skipfile, skipfile, skipall, newpatches
        while True:
            resps = messages['help'][operation]
            r = ui.promptchoice("%s %s" % (query, resps))
            ui.write("\n")
            if r == 8: # ?
                for c, t in ui.extractchoices(resps)[1]:
                    ui.write('%s - %s\n' % (c, encoding.lower(t)))
                continue
            elif r == 0: # yes
                ret = True
            elif r == 1: # no
                ret = False
            elif r == 2: # Edit patch
                if chunk is None:
                    ui.write(_('cannot edit patch for whole file'))
                    ui.write("\n")
                    continue
                if chunk.header.binary():
                    ui.write(_('cannot edit patch for binary file'))
                    ui.write("\n")
                    continue
                # Patch comment based on the Git one (based on comment at end of
                # https://mercurial-scm.org/wiki/RecordExtension)
                phelp = '---' + _("""
To remove '-' lines, make them ' ' lines (context).
To remove '+' lines, delete them.
Lines starting with # will be removed from the patch.

If the patch applies cleanly, the edited hunk will immediately be
added to the record list. If it does not apply cleanly, a rejects
file will be generated: you can use that when you try again. If
all lines of the hunk are removed, then the edit is aborted and
the hunk is left unchanged.
""")
                (patchfd, patchfn) = pycompat.mkstemp(prefix="hg-editor-",
                                                      suffix=".diff")
                ncpatchfp = None
                try:
                    # Write the initial patch
                    f = util.nativeeolwriter(os.fdopen(patchfd, r'wb'))
                    chunk.header.write(f)
                    chunk.write(f)
                    f.write('\n'.join(['# ' + i for i in phelp.splitlines()]))
                    f.close()
                    # Start the editor and wait for it to complete
                    editor = ui.geteditor()
                    ret = ui.system("%s \"%s\"" % (editor, patchfn),
                                    environ={'HGUSER': ui.username()},
                                    blockedtag='filterpatch')
                    if ret != 0:
                        ui.warn(_("editor exited with exit code %d\n") % ret)
                        continue
                    # Remove comment lines
                    patchfp = open(patchfn, r'rb')
                    ncpatchfp = stringio()
                    for line in util.iterfile(patchfp):
                        line = util.fromnativeeol(line)
                        if not line.startswith('#'):
                            ncpatchfp.write(line)
                    patchfp.close()
                    ncpatchfp.seek(0)
                    newpatches = parsepatch(ncpatchfp)
                finally:
                    os.unlink(patchfn)
                    del ncpatchfp
                # Signal that the chunk shouldn't be applied as-is, but
                # provide the new patch to be used instead.
                ret = False
            elif r == 3: # Skip
                ret = skipfile = False
            elif r == 4: # file (Record remaining)
                ret = skipfile = True
            elif r == 5: # done, skip remaining
                ret = skipall = False
            elif r == 6: # all
                ret = skipall = True
            elif r == 7: # quit
                raise error.Abort(_('user quit'))
            return ret, skipfile, skipall, newpatches

    seen = set()
    applied = {}        # 'filename' -> [] of chunks
    skipfile, skipall = None, None
    pos, total = 1, sum(len(h.hunks) for h in headers)
    for h in headers:
        pos += len(h.hunks)
        skipfile = None
        # running line-offset correction caused by refused hunks above
        fixoffset = 0
        hdr = ''.join(h.header)
        if hdr in seen:
            continue
        seen.add(hdr)
        if skipall is None:
            h.pretty(ui)
            msg = (_('examine changes to %s?') %
                   _(' and ').join("'%s'" % f for f in h.files()))
            r, skipfile, skipall, np = prompt(skipfile, skipall, msg, None)
            if not r:
                continue
        applied[h.filename()] = [h]
        if h.allhunks():
            # all-or-nothing header: take every hunk without asking
            applied[h.filename()] += h.hunks
            continue
        for i, chunk in enumerate(h.hunks):
            if skipfile is None and skipall is None:
                chunk.pretty(ui)
            if total == 1:
                msg = messages['single'][operation] % chunk.filename()
            else:
                idx = pos - len(h.hunks) + i
                msg = messages['multiple'][operation] % (idx, total,
                                                         chunk.filename())
            r, skipfile, skipall, newpatches = prompt(skipfile,
                                                      skipall, msg, chunk)
            if r:
                if fixoffset:
                    chunk = copy.copy(chunk)
                    chunk.toline += fixoffset
                applied[chunk.filename()].append(chunk)
            elif newpatches is not None:
                # the user edited the hunk: record the edited version
                for newpatch in newpatches:
                    for newhunk in newpatch.hunks:
                        if fixoffset:
                            newhunk.toline += fixoffset
                        applied[newhunk.filename()].append(newhunk)
            else:
                fixoffset += chunk.removed - chunk.added
    return (sum([h for h in applied.itervalues()
                if h[0].special() or len(h) > 1], []), {})
class hunk(object):
    """One hunk of a unified or context diff.

    ``a`` accumulates the old-side lines (kept with their '-'/' '
    prefix), ``b`` the new-side lines (prefix stripped), and ``hunk``
    the raw text including the header line, so the hunk can be written
    back verbatim (e.g. into a reject file).
    """
    def __init__(self, desc, num, lr, context):
        # desc: hunk header line; num: 1-based hunk number used in error
        # messages; lr: linereader supplying the hunk body (None builds
        # an empty shell, see getnormalized); context: True selects
        # context-diff parsing, otherwise unified.
        self.number = num
        self.desc = desc
        self.hunk = [desc]
        self.a = []
        self.b = []
        self.starta = self.lena = None
        self.startb = self.lenb = None
        if lr is not None:
            if context:
                self.read_context_hunk(lr)
            else:
                self.read_unified_hunk(lr)

    def getnormalized(self):
        """Return a copy with line endings normalized to LF."""

        def normalize(lines):
            nlines = []
            for line in lines:
                if line.endswith('\r\n'):
                    line = line[:-2] + '\n'
                nlines.append(line)
            return nlines

        # Dummy object, it is rebuilt manually
        nh = hunk(self.desc, self.number, None, None)
        nh.number = self.number
        nh.desc = self.desc
        nh.hunk = self.hunk
        nh.a = normalize(self.a)
        nh.b = normalize(self.b)
        nh.starta = self.starta
        nh.startb = self.startb
        nh.lena = self.lena
        nh.lenb = self.lenb
        return nh

    def read_unified_hunk(self, lr):
        # parse '@@ -start,len +start,len @@'; a missing length means 1
        m = unidesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.starta, self.lena, self.startb, self.lenb = m.groups()
        if self.lena is None:
            self.lena = 1
        else:
            self.lena = int(self.lena)
        if self.lenb is None:
            self.lenb = 1
        else:
            self.lenb = int(self.lenb)
        self.starta = int(self.starta)
        self.startb = int(self.startb)
        try:
            diffhelper.addlines(lr, self.hunk, self.lena, self.lenb,
                                self.a, self.b)
        except error.ParseError as e:
            raise PatchError(_("bad hunk #%d: %s") % (self.number, e))
        # if we hit eof before finishing out the hunk, the last line will
        # be zero length. Lets try to fix it up.
        while len(self.hunk[-1]) == 0:
            del self.hunk[-1]
            del self.a[-1]
            del self.b[-1]
            self.lena -= 1
            self.lenb -= 1
        self._fixnewline(lr)

    def read_context_hunk(self, lr):
        # first the old-side range line: '*** start[,end] ****'
        self.desc = lr.readline()
        m = contextdesc.match(self.desc)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.starta, aend = m.groups()
        self.starta = int(self.starta)
        if aend is None:
            aend = self.starta
        self.lena = int(aend) - self.starta
        if self.starta:
            self.lena += 1
        # read the old block; '- ' is a removal, '! ' a change, '  ' context
        for x in xrange(self.lena):
            l = lr.readline()
            if l.startswith('---'):
                # lines addition, old block is empty
                lr.push(l)
                break
            s = l[2:]
            if l.startswith('- ') or l.startswith('! '):
                u = '-' + s
            elif l.startswith('  '):
                u = ' ' + s
            else:
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.a.append(u)
            self.hunk.append(u)

        l = lr.readline()
        if l.startswith('\ '):
            # no-newline-at-eof marker: strip the trailing newline we kept
            s = self.a[-1][:-1]
            self.a[-1] = s
            self.hunk[-1] = s
            l = lr.readline()
        # then the new-side range line: '--- start[,end] ----'
        m = contextdesc.match(l)
        if not m:
            raise PatchError(_("bad hunk #%d") % self.number)
        self.startb, bend = m.groups()
        self.startb = int(self.startb)
        if bend is None:
            bend = self.startb
        self.lenb = int(bend) - self.startb
        if self.startb:
            self.lenb += 1
        hunki = 1
        # read the new block; '+ ' is an addition, '! ' a change
        for x in xrange(self.lenb):
            l = lr.readline()
            if l.startswith('\ '):
                # XXX: the only way to hit this is with an invalid line range.
                # The no-eol marker is not counted in the line range, but I
                # guess there are diff(1) out there which behave differently.
                s = self.b[-1][:-1]
                self.b[-1] = s
                self.hunk[hunki - 1] = s
                continue
            if not l:
                # line deletions, new block is empty and we hit EOF
                lr.push(l)
                break
            s = l[2:]
            if l.startswith('+ ') or l.startswith('! '):
                u = '+' + s
            elif l.startswith('  '):
                u = ' ' + s
            elif len(self.b) == 0:
                # line deletions, new block is empty
                lr.push(l)
                break
            else:
                raise PatchError(_("bad hunk #%d old text line %d") %
                                 (self.number, x))
            self.b.append(s)
            # splice the new-side line into the raw hunk at the right
            # position, skipping over old-side '-' lines already there
            while True:
                if hunki >= len(self.hunk):
                    h = ""
                else:
                    h = self.hunk[hunki]
                hunki += 1
                if h == u:
                    break
                elif h.startswith('-'):
                    continue
                else:
                    self.hunk.insert(hunki - 1, u)
                    break

        if not self.a:
            # this happens when lines were only added to the hunk
            for x in self.hunk:
                if x.startswith('-') or x.startswith(' '):
                    self.a.append(x)
        if not self.b:
            # this happens when lines were only deleted from the hunk
            for x in self.hunk:
                if x.startswith('+') or x.startswith(' '):
                    self.b.append(x[1:])
        # @@ -start,len +start,len @@
        self.desc = "@@ -%d,%d +%d,%d @@\n" % (self.starta, self.lena,
                                               self.startb, self.lenb)
        self.hunk[0] = self.desc
        self._fixnewline(lr)

    def _fixnewline(self, lr):
        # consume a trailing '\ No newline ...' marker if present
        l = lr.readline()
        if l.startswith('\ '):
            diffhelper.fixnewline(self.hunk, self.a, self.b)
        else:
            lr.push(l)

    def complete(self):
        # True once the parsed line counts match the declared ranges
        return len(self.a) == self.lena and len(self.b) == self.lenb

    def _fuzzit(self, old, new, fuzz, toponly):
        # this removes context lines from the top and bottom of list 'l'. It
        # checks the hunk to make sure only context lines are removed, and then
        # returns a new shortened list of lines.
        fuzz = min(fuzz, len(old))
        if fuzz:
            top = 0
            bot = 0
            hlen = len(self.hunk)
            for x in xrange(hlen - 1):
                # the hunk starts with the @@ line, so use x+1
                if self.hunk[x + 1].startswith(' '):
                    top += 1
                else:
                    break
            if not toponly:
                for x in xrange(hlen - 1):
                    if self.hunk[hlen - bot - 1].startswith(' '):
                        bot += 1
                    else:
                        break

            bot = min(fuzz, bot)
            top = min(fuzz, top)
            return old[top:len(old) - bot], new[top:len(new) - bot], top
        return old, new, 0

    def fuzzit(self, fuzz, toponly):
        # Return (old, oldstart, new, newstart) with up to 'fuzz' context
        # lines trimmed and the start offsets adjusted accordingly.
        old, new, top = self._fuzzit(self.a, self.b, fuzz, toponly)
        oldstart = self.starta + top
        newstart = self.startb + top
        # zero length hunk ranges already have their start decremented
        if self.lena and oldstart > 0:
            oldstart -= 1
        if self.lenb and newstart > 0:
            newstart -= 1
        return old, oldstart, new, newstart
1426
class binhunk(object):
    'A binary patch file.'
    def __init__(self, lr, fname):
        # self.text holds the decoded payload once _read() succeeds
        self.text = None
        self.delta = False
        self.hunk = ['GIT binary patch\n']
        self._fname = fname
        self._read(lr)

    def complete(self):
        return self.text is not None

    def new(self, lines):
        """Return the new file content as a one-element list.

        For delta hunks, 'lines' is the base content the delta is
        applied against.
        """
        if self.delta:
            return [applybindelta(self.text, ''.join(lines))]
        return [self.text]

    def _read(self, lr):
        def getline(lr, hunk):
            l = lr.readline()
            hunk.append(l)
            return l.rstrip('\r\n')

        size = 0
        # skip to the 'literal <size>' or 'delta <size>' header
        while True:
            line = getline(lr, self.hunk)
            if not line:
                raise PatchError(_('could not extract "%s" binary data')
                                 % self._fname)
            if line.startswith('literal '):
                size = int(line[8:].rstrip())
                break
            if line.startswith('delta '):
                size = int(line[6:].rstrip())
                self.delta = True
                break
        dec = []
        line = getline(lr, self.hunk)
        while len(line) > 1:
            # first char encodes the decoded length of the line:
            # 'A'-'Z' -> 1..26, 'a'-'z' -> 27..52
            l = line[0:1]
            if l <= 'Z' and l >= 'A':
                l = ord(l) - ord('A') + 1
            else:
                l = ord(l) - ord('a') + 27
            try:
                dec.append(util.b85decode(line[1:])[:l])
            except ValueError as e:
                raise PatchError(_('could not decode "%s" binary patch: %s')
                                 % (self._fname, stringutil.forcebytestr(e)))
            line = getline(lr, self.hunk)
        # the payload is zlib-compressed; 'size' is the expected
        # decompressed length
        text = zlib.decompress(''.join(dec))
        if len(text) != size:
            raise PatchError(_('"%s" length is %d bytes, should be %d')
                             % (self._fname, len(text), size))
        self.text = text
1482
1483 def parsefilename(str):
1484 # --- filename \t|space stuff
1485 s = str[4:].rstrip('\r\n')
1486 i = s.find('\t')
1487 if i < 0:
1488 i = s.find(' ')
1489 if i < 0:
1490 return s
1491 return s[:i]
1492
def reversehunks(hunks):
    '''reverse the signs in the hunks given as argument

    This function operates on hunks coming out of patch.filterpatch, that is
    a list of the form: [header1, hunk1, hunk2, header2...]. Example usage:

    >>> rawpatch = b"""diff --git a/folder1/g b/folder1/g
    ... --- a/folder1/g
    ... +++ b/folder1/g
    ... @@ -1,7 +1,7 @@
    ... +firstline
    ... c
    ... 1
    ... 2
    ... + 3
    ... -4
    ... 5
    ... d
    ... +lastline"""
    >>> hunks = parsepatch([rawpatch])
    >>> hunkscomingfromfilterpatch = []
    >>> for h in hunks:
    ...     hunkscomingfromfilterpatch.append(h)
    ...     hunkscomingfromfilterpatch.extend(h.hunks)

    >>> reversedhunks = reversehunks(hunkscomingfromfilterpatch)
    >>> from . import util
    >>> fp = util.stringio()
    >>> for c in reversedhunks:
    ...      c.write(fp)
    >>> fp.seek(0) or None
    >>> reversedpatch = fp.read()
    >>> print(pycompat.sysstr(reversedpatch))
    diff --git a/folder1/g b/folder1/g
    --- a/folder1/g
    +++ b/folder1/g
    @@ -1,4 +1,3 @@
    -firstline
     c
     1
     2
    @@ -2,6 +1,6 @@
     c
     1
     2
    - 3
    +4
     5
     d
    @@ -6,3 +5,2 @@
     5
     d
    -lastline

    '''

    # headers have no reversehunk() and pass through unchanged
    return [c.reversehunk() if util.safehasattr(c, 'reversehunk') else c
            for c in hunks]
1555
def parsepatch(originalchunks, maxcontext=None):
    """patch -> [] of headers -> [] of hunks

    If maxcontext is not None, trim context lines if necessary.

    >>> rawpatch = b'''diff --git a/folder1/g b/folder1/g
    ... --- a/folder1/g
    ... +++ b/folder1/g
    ... @@ -1,8 +1,10 @@
    ... 1
    ... 2
    ... -3
    ... 4
    ... 5
    ... 6
    ... +6.1
    ... +6.2
    ... 7
    ... 8
    ... +9'''
    >>> out = util.stringio()
    >>> headers = parsepatch([rawpatch], maxcontext=1)
    >>> for header in headers:
    ...     header.write(out)
    ...     for hunk in header.hunks:
    ...         hunk.write(out)
    >>> print(pycompat.sysstr(out.getvalue()))
    diff --git a/folder1/g b/folder1/g
    --- a/folder1/g
    +++ b/folder1/g
    @@ -2,3 +2,2 @@
     2
    -3
     4
    @@ -6,2 +5,4 @@
     6
    +6.1
    +6.2
     7
    @@ -8,1 +9,2 @@
     8
    +9
    """
    class parser(object):
        """patch parsing state machine"""
        def __init__(self):
            self.fromline = 0
            self.toline = 0
            self.proc = ''
            self.header = None
            self.context = []
            self.before = []
            self.hunk = []
            self.headers = []

        def addrange(self, limits):
            # record the line ranges of an '@@ ... @@' line
            fromstart, fromend, tostart, toend, proc = limits
            self.fromline = int(fromstart)
            self.toline = int(tostart)
            self.proc = proc

        def addcontext(self, context):
            # trailing context closes the pending hunk, if any
            if self.hunk:
                h = recordhunk(self.header, self.fromline, self.toline,
                               self.proc, self.before, self.hunk, context,
                               maxcontext)
                self.header.hunks.append(h)
                self.fromline += len(self.before) + h.removed
                self.toline += len(self.before) + h.added
                self.before = []
                self.hunk = []
            self.context = context

        def addhunk(self, hunk):
            # context seen so far becomes the hunk's leading context
            if self.context:
                self.before = self.context
                self.context = []
            self.hunk = hunk

        def newfile(self, hdr):
            # flush any pending hunk, then start a new header
            self.addcontext([])
            h = header(hdr)
            self.headers.append(h)
            self.header = h

        def addother(self, line):
            pass # 'other' lines are ignored

        def finished(self):
            self.addcontext([])
            return self.headers

        # state -> {event -> handler}; any missing entry is an invalid
        # transition and raises PatchError below
        transitions = {
            'file': {'context': addcontext,
                     'file': newfile,
                     'hunk': addhunk,
                     'range': addrange},
            'context': {'file': newfile,
                        'hunk': addhunk,
                        'range': addrange,
                        'other': addother},
            'hunk': {'context': addcontext,
                     'file': newfile,
                     'range': addrange},
            'range': {'context': addcontext,
                      'hunk': addhunk},
            'other': {'other': addother},
            }

    p = parser()
    fp = stringio()
    fp.write(''.join(originalchunks))
    fp.seek(0)

    state = 'context'
    # drive the state machine with the events emitted by scanpatch()
    for newstate, data in scanpatch(fp):
        try:
            p.transitions[state][newstate](p, data)
        except KeyError:
            raise PatchError('unhandled transition: %s -> %s' %
                             (state, newstate))
        state = newstate
    del fp
    return p.finished()
1679
def pathtransform(path, strip, prefix):
    '''turn a path from a patch into a path suitable for the repository

    prefix, if not empty, is expected to be normalized with a / at the end.

    Returns (stripped components, path in repository).

    >>> pathtransform(b'a/b/c', 0, b'')
    ('', 'a/b/c')
    >>> pathtransform(b'   a/b/c   ', 0, b'')
    ('', '   a/b/c')
    >>> pathtransform(b'   a/b/c   ', 2, b'')
    ('a/b/', 'c')
    >>> pathtransform(b'a/b/c', 0, b'd/e/')
    ('', 'd/e/a/b/c')
    >>> pathtransform(b'   a//b/c   ', 2, b'd/e/')
    ('a//b/', 'd/e/c')
    >>> pathtransform(b'a/b/c', 3, b'')
    Traceback (most recent call last):
    PatchError: unable to strip away 1 of 3 dirs from a/b/c
    '''
    if strip == 0:
        return '', prefix + path.rstrip()
    end = len(path)
    idx = 0
    remaining = strip
    while remaining > 0:
        idx = path.find('/', idx)
        if idx == -1:
            raise PatchError(_("unable to strip away %d of %d dirs from %s") %
                             (remaining, strip, path))
        idx += 1
        # consume runs of '/' so 'a//b' strips like 'a/b'
        while idx < end - 1 and path[idx:idx + 1] == '/':
            idx += 1
        remaining -= 1
    return path[:idx].lstrip(), prefix + path[idx:].rstrip()
1717
def makepatchmeta(backend, afile_orig, bfile_orig, hunk, strip, prefix):
    """Build a patchmeta for a plain (non-git) patch hunk.

    From the '---'/'+++' names and the first hunk's ranges, decide
    whether the patch creates ('ADD'), removes ('DELETE') or modifies a
    file, and which repository path should actually be patched.
    """
    nulla = afile_orig == "/dev/null"
    nullb = bfile_orig == "/dev/null"
    # a 0,0 range against /dev/null marks creation/removal
    create = nulla and hunk.starta == 0 and hunk.lena == 0
    remove = nullb and hunk.startb == 0 and hunk.lenb == 0
    abase, afile = pathtransform(afile_orig, strip, prefix)
    gooda = not nulla and backend.exists(afile)
    bbase, bfile = pathtransform(bfile_orig, strip, prefix)
    if afile == bfile:
        goodb = gooda
    else:
        goodb = not nullb and backend.exists(bfile)
    missing = not goodb and not gooda and not create

    # some diff programs apparently produce patches where the afile is
    # not /dev/null, but afile starts with bfile
    abasedir = afile[:afile.rfind('/') + 1]
    bbasedir = bfile[:bfile.rfind('/') + 1]
    if (missing and abasedir == bbasedir and afile.startswith(bfile)
        and hunk.starta == 0 and hunk.lena == 0):
        create = True
        missing = False

    # If afile is "a/b/foo" and bfile is "a/b/foo.orig" we assume the
    # diff is between a file and its backup. In this case, the original
    # file should be patched (see original mpatch code).
    isbackup = (abase == bbase and bfile.startswith(afile))
    fname = None
    if not missing:
        if gooda and goodb:
            if isbackup:
                fname = afile
            else:
                fname = bfile
        elif gooda:
            fname = afile

    if not fname:
        if not nullb:
            if isbackup:
                fname = afile
            else:
                fname = bfile
        elif not nulla:
            fname = afile
        else:
            raise PatchError(_("undefined source and destination files"))

    gp = patchmeta(fname)
    if create:
        gp.op = 'ADD'
    elif remove:
        gp.op = 'DELETE'
    return gp
1772
def scanpatch(fp):
    """like patch.iterhunks, but yield different events

    - ('file', [header_lines + fromfile + tofile])
    - ('context', [context_lines])
    - ('hunk', [hunk_lines])
    - ('range', (-start,len, +start,len, proc))
    """
    lines_re = re.compile(br'@@ -(\d+),(\d+) \+(\d+),(\d+) @@\s*(.*)')
    lr = linereader(fp)

    def scanwhile(first, p):
        """scan lr while predicate holds"""
        lines = [first]
        for line in iter(lr.readline, ''):
            if p(line):
                lines.append(line)
            else:
                # first non-matching line is pushed back for the caller
                lr.push(line)
                break
        return lines

    for line in iter(lr.readline, ''):
        if line.startswith('diff --git a/') or line.startswith('diff -r '):
            def notheader(line):
                s = line.split(None, 1)
                return not s or s[0] not in ('---', 'diff')
            # collect header lines up to (not including) '---'/'diff'
            header = scanwhile(line, notheader)
            fromfile = lr.readline()
            if fromfile.startswith('---'):
                tofile = lr.readline()
                header += [fromfile, tofile]
            else:
                lr.push(fromfile)
            yield 'file', header
        elif line.startswith(' '):
            # '\' covers the '\ No newline at end of file' marker
            cs = (' ', '\\')
            yield 'context', scanwhile(line, lambda l: l.startswith(cs))
        elif line.startswith(('-', '+')):
            cs = ('-', '+', '\\')
            yield 'hunk', scanwhile(line, lambda l: l.startswith(cs))
        else:
            m = lines_re.match(line)
            if m:
                yield 'range', m.groups()
            else:
                yield 'other', line
1820
def scangitpatch(lr, firstline):
    """
    Git patches can emit:
    - rename a to b
    - change b
    - copy a to c
    - change c

    We cannot apply this sequence as-is, the renamed 'a' could not be
    found for it would have been renamed already. And we cannot copy
    from 'b' instead because 'b' would have been changed already. So
    we scan the git patch for copy and rename commands so we can
    perform the copies ahead of time.
    """
    pos = 0
    try:
        pos = lr.fp.tell()
        fp = lr.fp
    except IOError:
        # unseekable input (e.g. a pipe): buffer the rest so we can
        # rewind after the pre-scan
        fp = stringio(lr.fp.read())
    gitlr = linereader(fp)
    gitlr.push(firstline)
    gitpatches = readgitpatch(gitlr)
    # rewind so the main parse sees the same data again
    fp.seek(pos)
    return gitpatches
1846
def iterhunks(fp):
    """Read a patch and yield the following events:
    - ("file", afile, bfile, firsthunk): select a new target file.
    - ("hunk", hunk): a new hunk is ready to be applied, follows a
    "file" event.
    - ("git", gitchanges): current diff is in git format, gitchanges
    maps filenames to gitpatch records. Unique event.
    """
    afile = ""
    bfile = ""
    state = None
    hunknum = 0
    emitfile = newfile = False
    gitpatches = None

    # our states
    BFILE = 1
    # context is None until we know the diff flavor: False for unified,
    # True for context diffs
    context = None
    lr = linereader(fp)

    for x in iter(lr.readline, ''):
        if state == BFILE and (
            (not context and x.startswith('@'))
            or (context is not False and x.startswith('***************'))
            or x.startswith('GIT binary patch')):
            # start of a hunk for the current file
            gp = None
            if (gitpatches and
                gitpatches[-1].ispatching(afile, bfile)):
                gp = gitpatches.pop()
            if x.startswith('GIT binary patch'):
                h = binhunk(lr, gp.path)
            else:
                if context is None and x.startswith('***************'):
                    context = True
                h = hunk(x, hunknum + 1, lr, context)
            hunknum += 1
            if emitfile:
                # first hunk of the file: announce the file itself
                emitfile = False
                yield 'file', (afile, bfile, h, gp and gp.copy() or None)
            yield 'hunk', h
        elif x.startswith('diff --git a/'):
            m = gitre.match(x.rstrip(' \r\n'))
            if not m:
                continue
            if gitpatches is None:
                # scan whole input for git metadata
                gitpatches = scangitpatch(lr, x)
                yield 'git', [g.copy() for g in gitpatches
                              if g.op in ('COPY', 'RENAME')]
                gitpatches.reverse()
            afile = 'a/' + m.group(1)
            bfile = 'b/' + m.group(2)
            # emit hunkless git patches (mode changes, renames...) that
            # precede the current file in the metadata list
            while gitpatches and not gitpatches[-1].ispatching(afile, bfile):
                gp = gitpatches.pop()
                yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())
            if not gitpatches:
                raise PatchError(_('failed to synchronize metadata for "%s"')
                                 % afile[2:])
            gp = gitpatches[-1]
            newfile = True
        elif x.startswith('---'):
            # check for a unified diff
            l2 = lr.readline()
            if not l2.startswith('+++'):
                lr.push(l2)
                continue
            newfile = True
            context = False
            afile = parsefilename(x)
            bfile = parsefilename(l2)
        elif x.startswith('***'):
            # check for a context diff
            l2 = lr.readline()
            if not l2.startswith('---'):
                lr.push(l2)
                continue
            l3 = lr.readline()
            lr.push(l3)
            if not l3.startswith("***************"):
                lr.push(l2)
                continue
            newfile = True
            context = True
            afile = parsefilename(x)
            bfile = parsefilename(l2)

        if newfile:
            newfile = False
            emitfile = True
            state = BFILE
            hunknum = 0

    # flush remaining hunkless git patches
    while gitpatches:
        gp = gitpatches.pop()
        yield 'file', ('a/' + gp.path, 'b/' + gp.path, None, gp.copy())
1942
def applybindelta(binchunk, data):
    """Apply a binary delta hunk
    The algorithm used is the algorithm from git's patch-delta.c
    """
    def deltahead(binchunk):
        # length in bytes of a variable-width integer header: each byte's
        # high bit (0x80) signals a continuation byte
        i = 0
        for c in pycompat.bytestr(binchunk):
            i += 1
            if not (ord(c) & 0x80):
                return i
        return i
    out = ""
    # skip the two size headers at the front of the delta
    s = deltahead(binchunk)
    binchunk = binchunk[s:]
    s = deltahead(binchunk)
    binchunk = binchunk[s:]
    i = 0
    while i < len(binchunk):
        cmd = ord(binchunk[i:i + 1])
        i += 1
        if (cmd & 0x80):
            # copy opcode: the low bits select which offset/size bytes
            # follow (little-endian, omitted bytes are zero)
            offset = 0
            size = 0
            if (cmd & 0x01):
                offset = ord(binchunk[i:i + 1])
                i += 1
            if (cmd & 0x02):
                offset |= ord(binchunk[i:i + 1]) << 8
                i += 1
            if (cmd & 0x04):
                offset |= ord(binchunk[i:i + 1]) << 16
                i += 1
            if (cmd & 0x08):
                offset |= ord(binchunk[i:i + 1]) << 24
                i += 1
            if (cmd & 0x10):
                size = ord(binchunk[i:i + 1])
                i += 1
            if (cmd & 0x20):
                size |= ord(binchunk[i:i + 1]) << 8
                i += 1
            if (cmd & 0x40):
                size |= ord(binchunk[i:i + 1]) << 16
                i += 1
            if size == 0:
                # an encoded size of zero means 0x10000 bytes
                size = 0x10000
            offset_end = offset + size
            out += data[offset:offset_end]
        elif cmd != 0:
            # insert opcode: the next 'cmd' bytes are literal data
            offset_end = i + cmd
            out += binchunk[i:offset_end]
            i += cmd
        else:
            raise PatchError(_('unexpected delta opcode 0'))
    return out
1998
def applydiff(ui, fp, backend, store, strip=1, prefix='', eolmode='strict'):
    """Reads a patch from fp and tries to apply it.

    Returns 0 for a clean patch, -1 if any rejects were found and 1 if
    there was any fuzz.

    If 'eolmode' is 'strict', the patch content and patched file are
    read in binary mode. Otherwise, line endings are ignored when
    patching then normalized according to 'eolmode'.
    """
    # thin wrapper selecting the regular patchfile implementation
    return _applydiff(ui, fp, patchfile, backend, store, strip=strip,
                      prefix=prefix, eolmode=eolmode)
2011
def _canonprefix(repo, prefix):
    """Canonicalize *prefix* against the repo root and working directory,
    appending a trailing slash when the result is non-empty."""
    if not prefix:
        return prefix
    canonical = pathutil.canonpath(repo.root, repo.getcwd(), prefix)
    if canonical == '':
        return canonical
    return canonical + '/'
2018
def _applydiff(ui, fp, patcher, backend, store, strip=1, prefix='',
               eolmode='strict'):
    """Drive iterhunks() over fp and apply each parsed event via *patcher*.

    *patcher* is a patchfile-compatible factory.  Returns 0 on clean
    apply, 1 if any hunk applied with fuzz, -1 if any rejects occurred.
    """
    prefix = _canonprefix(backend.repo, prefix)
    def pstrip(p):
        # strip path components and re-root under the canonical prefix
        return pathtransform(p, strip - 1, prefix)[1]

    rejects = 0
    err = 0
    current_file = None

    for state, values in iterhunks(fp):
        if state == 'hunk':
            # hunks arriving with no open file were rejected at 'file' time
            if not current_file:
                continue
            ret = current_file.apply(values)
            if ret > 0:
                err = 1
        elif state == 'file':
            # close the previous file before starting a new one
            if current_file:
                rejects += current_file.close()
            current_file = None
            afile, bfile, first_hunk, gp = values
            if gp:
                gp.path = pstrip(gp.path)
                if gp.oldpath:
                    gp.oldpath = pstrip(gp.oldpath)
            else:
                gp = makepatchmeta(backend, afile, bfile, first_hunk, strip,
                                   prefix)
            if gp.op == 'RENAME':
                backend.unlink(gp.oldpath)
            if not first_hunk:
                # metadata-only change: no text hunks to apply
                if gp.op == 'DELETE':
                    backend.unlink(gp.path)
                    continue
                data, mode = None, None
                if gp.op in ('RENAME', 'COPY'):
                    data, mode = store.getfile(gp.oldpath)[:2]
                    if data is None:
                        # This means that the old path does not exist
                        raise PatchError(_("source file '%s' does not exist")
                                         % gp.oldpath)
                if gp.mode:
                    mode = gp.mode
                    if gp.op == 'ADD':
                        # Added files without content have no hunk and
                        # must be created
                        data = ''
                if data or mode:
                    if (gp.op in ('ADD', 'RENAME', 'COPY')
                        and backend.exists(gp.path)):
                        raise PatchError(_("cannot create %s: destination "
                                           "already exists") % gp.path)
                    backend.setfile(gp.path, data, mode, gp.oldpath)
                continue
            try:
                current_file = patcher(ui, gp, backend, store,
                                       eolmode=eolmode)
            except PatchError as inst:
                # count the whole file as rejected and skip its hunks
                ui.warn(str(inst) + '\n')
                current_file = None
                rejects += 1
                continue
        elif state == 'git':
            # preload originals of copy/rename sources into the store
            for gp in values:
                path = pstrip(gp.oldpath)
                data, mode = backend.getfile(path)
                if data is None:
                    # The error ignored here will trigger a getfile()
                    # error in a place more appropriate for error
                    # handling, and will not interrupt the patching
                    # process.
                    pass
                else:
                    store.setfile(path, data, mode)
        else:
            raise error.Abort(_('unsupported parser state: %s') % state)

    if current_file:
        rejects += current_file.close()

    if rejects:
        return -1
    return err
2103
def _externalpatch(ui, repo, patcher, patchname, strip, files,
                   similarity):
    """use <patcher> to apply <patchname> to the working directory.
    returns whether patch was applied with fuzz factor.

    Touched file names are parsed from the tool's output and added to
    *files*; raises PatchError when the external command exits non-zero.
    """

    fuzz = False
    args = []
    cwd = repo.root
    if cwd:
        args.append('-d %s' % procutil.shellquote(cwd))
    cmd = ('%s %s -p%d < %s'
           % (patcher, ' '.join(args), strip, procutil.shellquote(patchname)))
    ui.debug('Using external patch tool: %s\n' % cmd)
    fp = procutil.popen(cmd, 'rb')
    try:
        for line in util.iterfile(fp):
            line = line.rstrip()
            ui.note(line + '\n')
            if line.startswith('patching file '):
                pf = util.parsepatchoutput(line)
                printed_file = False
                files.add(pf)
            elif line.find('with fuzz') >= 0:
                # NOTE(review): 'pf'/'printed_file' are only bound once a
                # "patching file" line has been seen; this assumes the tool
                # always emits that line first — confirm against GNU patch.
                fuzz = True
                if not printed_file:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
            elif line.find('saving rejects to file') >= 0:
                ui.warn(line + '\n')
            elif line.find('FAILED') >= 0:
                if not printed_file:
                    ui.warn(pf + '\n')
                    printed_file = True
                ui.warn(line + '\n')
    finally:
        # record touched files even on failure, then surface exit status
        if files:
            scmutil.marktouched(repo, files, similarity)
        code = fp.close()
        if code:
            raise PatchError(_("patch command failed: %s") %
                             procutil.explainexit(code))
    return fuzz
2147
def patchbackend(ui, backend, patchobj, strip, prefix, files=None,
                 eolmode='strict'):
    """Apply *patchobj* through *backend*, recording touched paths in
    *files*.  Returns True when the patch applied with fuzz; raises
    PatchError when it failed to apply."""
    if files is None:
        files = set()
    if eolmode is None:
        eolmode = ui.config('patch', 'eol')
    normalized = eolmode.lower()
    if normalized not in eolmodes:
        raise error.Abort(_('unsupported line endings type: %s') % eolmode)
    eolmode = normalized

    store = filestore()
    try:
        # accept either a file name or an already-open file object
        patchfp = open(patchobj, 'rb')
    except TypeError:
        patchfp = patchobj
    try:
        ret = applydiff(ui, patchfp, backend, store, strip=strip,
                        prefix=prefix, eolmode=eolmode)
    finally:
        if patchfp != patchobj:
            patchfp.close()
        files.update(backend.close())
        store.close()
    if ret < 0:
        raise PatchError(_('patch failed to apply'))
    return ret > 0
2174
def internalpatch(ui, repo, patchobj, strip, prefix='', files=None,
                  eolmode='strict', similarity=0):
    """Apply <patchobj> to the working directory with the builtin patch
    code.  Returns whether the patch was applied with fuzz factor."""
    return patchbackend(ui, workingbackend(ui, repo, similarity), patchobj,
                        strip, prefix, files, eolmode)
2181
def patchrepo(ui, repo, ctx, store, patchobj, strip, prefix, files=None,
              eolmode='strict'):
    """Apply *patchobj* on top of *ctx*, writing the results into *store*."""
    return patchbackend(ui, repobackend(ui, repo, ctx, store), patchobj,
                        strip, prefix, files, eolmode)
2186
def patch(ui, repo, patchname, strip=1, prefix='', files=None, eolmode='strict',
          similarity=0):
    """Apply <patchname> to the working directory.

    'eolmode' specifies how end of lines should be handled. It can be:
    - 'strict': inputs are read in binary mode, EOLs are preserved
    - 'crlf': EOLs are ignored when patching and reset to CRLF
    - 'lf': EOLs are ignored when patching and reset to LF
    - None: get it from user settings, default to 'strict'
    'eolmode' is ignored when using an external patcher program.

    Returns whether patch was applied with fuzz factor.
    """
    if files is None:
        files = set()
    externaltool = ui.config('ui', 'patch')
    if not externaltool:
        return internalpatch(ui, repo, patchname, strip, prefix, files,
                             eolmode, similarity)
    return _externalpatch(ui, repo, externaltool, patchname, strip, files,
                          similarity)
2208
def changedfiles(ui, repo, patchpath, strip=1, prefix=''):
    """Return the set of file names touched by the patch at *patchpath*,
    including rename sources."""
    backend = fsbackend(ui, repo.root)
    prefix = _canonprefix(repo, prefix)
    changed = set()
    with open(patchpath, 'rb') as fp:
        for state, values in iterhunks(fp):
            if state in ('hunk', 'git'):
                # only 'file' events carry path information we need
                continue
            if state != 'file':
                raise error.Abort(_('unsupported parser state: %s') % state)
            afile, bfile, first_hunk, gp = values
            if gp:
                gp.path = pathtransform(gp.path, strip - 1, prefix)[1]
                if gp.oldpath:
                    gp.oldpath = pathtransform(gp.oldpath, strip - 1,
                                               prefix)[1]
            else:
                gp = makepatchmeta(backend, afile, bfile, first_hunk,
                                   strip, prefix)
            changed.add(gp.path)
            if gp.op == 'RENAME':
                changed.add(gp.oldpath)
    return changed
2231
class GitDiffRequired(Exception):
    """Raised while diffing to request an upgrade to git diff format."""
    pass
14 from .. import (
15 mdiff,
16 pycompat,
17 )
2234 18
def diffallopts(ui, opts=None, untrusted=False, section='diff'):
    """Return diffopts with every supported feature enabled and parsed."""
    return difffeatureopts(ui, opts=opts, untrusted=untrusted,
                           section=section, git=True, whitespace=True,
                           formatchanging=True)

# historical alias kept for existing callers
diffopts = diffallopts
2241 25
def difffeatureopts(ui, opts=None, untrusted=False, section='diff', git=False,
                    whitespace=False, formatchanging=False):
    '''return diffopts with only opted-in features parsed

    Features:
    - git: git-style diffs
    - whitespace: whitespace options like ignoreblanklines and ignorews
    - formatchanging: options that will likely break or cause correctness issues
      with most diff parsers

    Command-line *opts* take precedence over config values read from
    *section*; returns an mdiff.diffopts instance.
    '''
    def get(key, name=None, getter=ui.configbool, forceplain=None):
        if opts:
            v = opts.get(key)
            # diffopts flags are either None-default (which is passed
            # through unchanged, so we can identify unset values), or
            # some other falsey default (eg --unified, which defaults
            # to an empty string). We only want to override the config
            # entries from hgrc with command line values if they
            # appear to have been set, which is any truthy value,
            # True, or False.
            if v or isinstance(v, bool):
                return v
        if forceplain is not None and ui.plain():
            return forceplain
        return getter(section, name or key, untrusted=untrusted)

    # core options, expected to be understood by every diff parser
    buildopts = {
        'nodates': get('nodates'),
        'showfunc': get('show_function', 'showfunc'),
        'context': get('unified', getter=ui.config),
    }
    buildopts['worddiff'] = ui.configbool('experimental', 'worddiff')
    buildopts['xdiff'] = ui.configbool('experimental', 'xdiff')

    if git:
        buildopts['git'] = get('git')

        # since this is in the experimental section, we need to call
        # ui.configbool directly
        buildopts['showsimilarity'] = ui.configbool('experimental',
                                                    'extendedheader.similarity')

        # need to inspect the ui object instead of using get() since we want to
        # test for an int
        hconf = ui.config('experimental', 'extendedheader.index')
        if hconf is not None:
            hlen = None
            try:
                # the hash config could be an integer (for length of hash) or a
                # word (e.g. short, full, none)
                hlen = int(hconf)
                if hlen < 0 or hlen > 40:
                    msg = _("invalid length for extendedheader.index: '%d'\n")
                    ui.warn(msg % hlen)
            except ValueError:
                # default value
                if hconf == 'short' or hconf == '':
                    hlen = 12
                elif hconf == 'full':
                    hlen = 40
                elif hconf != 'none':
                    msg = _("invalid value for extendedheader.index: '%s'\n")
                    ui.warn(msg % hconf)
            finally:
                # 'index' ends up None for invalid words and 'none'
                buildopts['index'] = hlen

    if whitespace:
        buildopts['ignorews'] = get('ignore_all_space', 'ignorews')
        buildopts['ignorewsamount'] = get('ignore_space_change',
                                          'ignorewsamount')
        buildopts['ignoreblanklines'] = get('ignore_blank_lines',
                                            'ignoreblanklines')
        buildopts['ignorewseol'] = get('ignore_space_at_eol', 'ignorewseol')
    if formatchanging:
        buildopts['text'] = opts and opts.get('text')
        binary = None if opts is None else opts.get('binary')
        buildopts['nobinary'] = (not binary if binary is not None
                                 else get('nobinary', forceplain=False))
        buildopts['noprefix'] = get('noprefix', forceplain=False)

    return mdiff.diffopts(**pycompat.strkwargs(buildopts))
2324
def diff(repo, node1=None, node2=None, match=None, changes=None,
         opts=None, losedatafn=None, prefix='', relroot='', copy=None,
         hunksfilterfn=None):
    '''yields diff of changes to files between two nodes, or node and
    working directory.

    if node1 is None, use first dirstate parent instead.
    if node2 is None, compare node1 with working directory.

    losedatafn(**kwarg) is a callable run when opts.upgrade=True and
    every time some change cannot be represented with the current
    patch format. Return False to upgrade to git patch format, True to
    accept the loss or raise an exception to abort the diff. It is
    called with the name of current file being diffed as 'fn'. If set
    to None, patches will always be upgraded to git format when
    necessary.

    prefix is a filename prefix that is prepended to all filenames on
    display (used for subrepos).

    relroot, if not empty, must be normalized with a trailing /. Any match
    patterns that fall outside it will be ignored.

    copy, if not empty, should contain mappings {dst@y: src@x} of copy
    information.

    hunksfilterfn, if not None, should be a function taking a filectx and
    hunks generator that may yield filtered hunks.
    '''
    hunksiter = diffhunks(repo, node1=node1, node2=node2, match=match,
                          changes=changes, opts=opts, losedatafn=losedatafn,
                          prefix=prefix, relroot=relroot, copy=copy)
    for fctx1, fctx2, hdr, hunks in hunksiter:
        if hunksfilterfn is not None:
            # If the file has been removed, fctx2 is None; but this should
            # not occur here since we catch removed files early in
            # logcmdutil.getlinerangerevs() for 'hg log -L'.
            assert fctx2 is not None, \
                'fctx2 unexpectly None in diff hunks filtering'
            hunks = hunksfilterfn(fctx2, hunks)
        pieces = []
        for hrange, hlines in hunks:
            pieces.extend(hlines)
        text = ''.join(pieces)
        if hdr and (text or len(hdr) > 1):
            yield '\n'.join(hdr) + '\n'
        if text:
            yield text
2371
def diffhunks(repo, node1=None, node2=None, match=None, changes=None,
              opts=None, losedatafn=None, prefix='', relroot='', copy=None):
    """Yield diff of changes to files in the form of (`header`, `hunks`) tuples
    where `header` is a list of diff headers and `hunks` is an iterable of
    (`hunkrange`, `hunklines`) tuples.

    See diff() for the meaning of parameters.
    """

    if opts is None:
        opts = mdiff.defaultopts

    if not node1 and not node2:
        node1 = repo.dirstate.p1()

    def lrugetfilectx():
        # small LRU cache of filelogs keyed by file name, capped at 20
        cache = {}
        order = collections.deque()
        def getfilectx(f, ctx):
            fctx = ctx.filectx(f, filelog=cache.get(f))
            if f not in cache:
                if len(cache) > 20:
                    del cache[order.popleft()]
                cache[f] = fctx.filelog()
            else:
                order.remove(f)
            order.append(f)
            return fctx
        return getfilectx
    getfilectx = lrugetfilectx()

    ctx1 = repo[node1]
    ctx2 = repo[node2]

    relfiltered = False
    if relroot != '' and match.always():
        # as a special case, create a new matcher with just the relroot
        pats = [relroot]
        match = scmutil.match(ctx2, pats, default='path')
        relfiltered = True

    if not changes:
        changes = repo.status(ctx1, ctx2, match=match)
    modified, added, removed = changes[:3]

    if not modified and not added and not removed:
        return []

    if repo.ui.debugflag:
        hexfunc = hex
    else:
        hexfunc = short
    revs = [hexfunc(node) for node in [ctx1.node(), ctx2.node()] if node]

    if copy is None:
        copy = {}
        if opts.git or opts.upgrade:
            copy = copies.pathcopies(ctx1, ctx2, match=match)

    if relroot is not None:
        if not relfiltered:
            # XXX this would ideally be done in the matcher, but that is
            # generally meant to 'or' patterns, not 'and' them. In this case we
            # need to 'and' all the patterns from the matcher with relroot.
            def filterrel(l):
                return [f for f in l if f.startswith(relroot)]
            modified = filterrel(modified)
            added = filterrel(added)
            removed = filterrel(removed)
            relfiltered = True
        # filter out copies where either side isn't inside the relative root
        copy = dict(((dst, src) for (dst, src) in copy.iteritems()
                     if dst.startswith(relroot)
                     and src.startswith(relroot)))

    modifiedset = set(modified)
    addedset = set(added)
    removedset = set(removed)
    for f in modified:
        if f not in ctx1:
            # Fix up added, since merged-in additions appear as
            # modifications during merges
            modifiedset.remove(f)
            addedset.add(f)
    for f in removed:
        if f not in ctx1:
            # Merged-in additions that are then removed are reported as removed.
            # They are not in ctx1, so We don't want to show them in the diff.
            removedset.remove(f)
    modified = sorted(modifiedset)
    added = sorted(addedset)
    removed = sorted(removedset)
    for dst, src in list(copy.items()):
        if src not in ctx1:
            # Files merged in during a merge and then copied/renamed are
            # reported as copies. We want to show them in the diff as additions.
            del copy[dst]

    # warm the file cache for everything the diff will touch
    prefetchmatch = scmutil.matchfiles(
        repo, list(modifiedset | addedset | removedset))
    scmutil.prefetchfiles(repo, [ctx1.rev(), ctx2.rev()], prefetchmatch)

    def difffn(opts, losedata):
        return trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
                       copy, getfilectx, opts, losedata, prefix, relroot)
    if opts.upgrade and not opts.git:
        try:
            def losedata(fn):
                if not losedatafn or not losedatafn(fn=fn):
                    raise GitDiffRequired
            # Buffer the whole output until we are sure it can be generated
            return list(difffn(opts.copy(git=False), losedata))
        except GitDiffRequired:
            return difffn(opts.copy(git=True), None)
    else:
        return difffn(opts, None)
2488
def diffsinglehunk(hunklines):
    """yield (token, label) pairs for the lines of a single hunk"""
    for line in hunklines:
        noeol = line.rstrip('\n')     # line without its newline
        nows = noeol.rstrip()         # ... and without trailing whitespace
        if line.startswith('-'):
            label = 'diff.deleted'
        elif line.startswith('+'):
            label = 'diff.inserted'
        else:
            raise error.ProgrammingError('unexpected hunk line: %s' % line)
        # tabs get their own label so they can be highlighted
        for token in tabsplitter.findall(nows):
            yield (token, 'diff.tab' if token.startswith('\t') else label)

        if noeol != nows:
            yield (noeol[len(nows):], 'diff.trailingwhitespace')
        if noeol != line:
            yield (line[len(noeol):], '')
2512
def diffsinglehunkinline(hunklines):
    """yield tokens for a list of lines in a single hunk, with inline colors

    Runs a word-level diff between the deleted and inserted sides so
    changed words can be labeled '.changed' and the rest '.unchanged'.
    """
    # prepare deleted, and inserted content
    a = ''
    b = ''
    for line in hunklines:
        if line[0] == '-':
            a += line[1:]
        elif line[0] == '+':
            b += line[1:]
        else:
            raise error.ProgrammingError('unexpected hunk line: %s' % line)
    # fast path: if either side is empty, use diffsinglehunk
    if not a or not b:
        for t in diffsinglehunk(hunklines):
            yield t
        return
    # re-split the content into words
    al = wordsplitter.findall(a)
    bl = wordsplitter.findall(b)
    # re-arrange the words to lines since the diff algorithm is line-based
    aln = [s if s == '\n' else s + '\n' for s in al]
    bln = [s if s == '\n' else s + '\n' for s in bl]
    an = ''.join(aln)
    bn = ''.join(bln)
    # run the diff algorithm, prepare atokens and btokens
    atokens = []
    btokens = []
    blocks = mdiff.allblocks(an, bn, lines1=aln, lines2=bln)
    for (a1, a2, b1, b2), btype in blocks:
        changed = btype == '!'
        for token in mdiff.splitnewlines(''.join(al[a1:a2])):
            atokens.append((changed, token))
        for token in mdiff.splitnewlines(''.join(bl[b1:b2])):
            btokens.append((changed, token))

    # yield deleted tokens, then inserted ones
    for prefix, label, tokens in [('-', 'diff.deleted', atokens),
                                  ('+', 'diff.inserted', btokens)]:
        nextisnewline = True
        for changed, token in tokens:
            if nextisnewline:
                # emit the '-'/'+' marker at the start of each output line
                yield (prefix, label)
                nextisnewline = False
            # special handling line end
            isendofline = token.endswith('\n')
            if isendofline:
                chomp = token[:-1] # chomp
                token = chomp.rstrip() # detect spaces at the end
                endspaces = chomp[len(token):]
            # scan tabs
            for maybetab in tabsplitter.findall(token):
                if '\t' == maybetab[0]:
                    currentlabel = 'diff.tab'
                else:
                    if changed:
                        currentlabel = label + '.changed'
                    else:
                        currentlabel = label + '.unchanged'
                yield (maybetab, currentlabel)
            if isendofline:
                if endspaces:
                    yield (endspaces, 'diff.trailingwhitespace')
                yield ('\n', '')
                nextisnewline = True
2578
def difflabel(func, *args, **kw):
    '''yields 2-tuples of (output, label) based on the output of func()

    Lines are classified as header or hunk text; adjacent '+'/'-' lines
    are buffered so a whole hunk can be handed to the hunk tokenizer.
    '''
    # choose word-level or line-level hunk coloring
    if kw.get(r'opts') and kw[r'opts'].worddiff:
        dodiffhunk = diffsinglehunkinline
    else:
        dodiffhunk = diffsinglehunk
    headprefixes = [('diff', 'diff.diffline'),
                    ('copy', 'diff.extended'),
                    ('rename', 'diff.extended'),
                    ('old', 'diff.extended'),
                    ('new', 'diff.extended'),
                    ('deleted', 'diff.extended'),
                    ('index', 'diff.extended'),
                    ('similarity', 'diff.extended'),
                    ('---', 'diff.file_a'),
                    ('+++', 'diff.file_b')]
    textprefixes = [('@', 'diff.hunk'),
                    # - and + are handled by diffsinglehunk
                   ]
    head = False

    # buffers a hunk, i.e. adjacent "-", "+" lines without other changes.
    hunkbuffer = []
    def consumehunkbuffer():
        # flush the buffered hunk through the tokenizer
        if hunkbuffer:
            for token in dodiffhunk(hunkbuffer):
                yield token
            hunkbuffer[:] = []

    for chunk in func(*args, **kw):
        lines = chunk.split('\n')
        linecount = len(lines)
        for i, line in enumerate(lines):
            if head:
                # a hunk start ('@@') terminates the header section
                if line.startswith('@'):
                    head = False
            else:
                if line and not line.startswith((' ', '+', '-', '@', '\\')):
                    head = True
            diffline = False
            if not head and line and line.startswith(('+', '-')):
                diffline = True

            prefixes = textprefixes
            if head:
                prefixes = headprefixes
            if diffline:
                # buffered
                bufferedline = line
                if i + 1 < linecount:
                    bufferedline += "\n"
                hunkbuffer.append(bufferedline)
            else:
                # unbuffered
                for token in consumehunkbuffer():
                    yield token
                stripline = line.rstrip()
                for prefix, label in prefixes:
                    if stripline.startswith(prefix):
                        yield (stripline, label)
                        if line != stripline:
                            yield (line[len(stripline):],
                                   'diff.trailingwhitespace')
                        break
                else:
                    yield (line, '')
                if i + 1 < linecount:
                    yield ('\n', '')
    for token in consumehunkbuffer():
        yield token
2649
def diffui(*args, **kw):
    '''like diff(), but yields 2-tuples of (output, label) for ui.write()'''
    return difflabel(diff, *args, **kw)
2653
2654 def _filepairs(modified, added, removed, copy, opts):
2655 '''generates tuples (f1, f2, copyop), where f1 is the name of the file
2656 before and f2 is the the name after. For added files, f1 will be None,
2657 and for removed files, f2 will be None. copyop may be set to None, 'copy'
2658 or 'rename' (the latter two only if opts.git is set).'''
2659 gone = set()
2660
2661 copyto = dict([(v, k) for k, v in copy.items()])
2662
2663 addedset, removedset = set(added), set(removed)
2664
2665 for f in sorted(modified + added + removed):
2666 copyop = None
2667 f1, f2 = f, f
2668 if f in addedset:
2669 f1 = None
2670 if f in copy:
2671 if opts.git:
2672 f1 = copy[f]
2673 if f1 in removedset and f1 not in gone:
2674 copyop = 'rename'
2675 gone.add(f1)
2676 else:
2677 copyop = 'copy'
2678 elif f in removedset:
2679 f2 = None
2680 if opts.git:
2681 # have we already reported a copy above?
2682 if (f in copyto and copyto[f] in addedset
2683 and copy[copyto[f]] == f):
2684 continue
2685 yield f1, f2, copyop
2686
def trydiff(repo, revs, ctx1, ctx2, modified, added, removed,
            copy, getfilectx, opts, losedatafn, prefix, relroot):
    '''given input data, generate a diff and yield it in blocks

    If generating a diff would lose data like flags or binary data and
    losedatafn is not None, it will be called.

    relroot is removed and prefix is added to every path in the diff output.

    If relroot is not empty, this function expects every path in modified,
    added, removed and copy to start with it.

    Yields (fctx1, fctx2, header, hunks) tuples, one per changed file.'''

    def gitindex(text):
        # sha1 of the content in git blob format, for 'index' lines
        if not text:
            text = ""
        l = len(text)
        s = hashlib.sha1('blob %d\0' % l)
        s.update(text)
        return hex(s.digest())

    if opts.noprefix:
        aprefix = bprefix = ''
    else:
        aprefix = 'a/'
        bprefix = 'b/'

    def diffline(f, revs):
        revinfo = ' '.join(["-r %s" % rev for rev in revs])
        return 'diff %s %s' % (revinfo, f)

    def isempty(fctx):
        return fctx is None or fctx.size() == 0

    date1 = dateutil.datestr(ctx1.date())
    date2 = dateutil.datestr(ctx2.date())

    gitmode = {'l': '120000', 'x': '100755', '': '100644'}

    # developer sanity check: every path must live under relroot
    if relroot != '' and (repo.ui.configbool('devel', 'all-warnings')
                          or repo.ui.configbool('devel', 'check-relroot')):
        for f in modified + added + removed + list(copy) + list(copy.values()):
            if f is not None and not f.startswith(relroot):
                raise AssertionError(
                    "file %s doesn't start with relroot %s" % (f, relroot))

    for f1, f2, copyop in _filepairs(modified, added, removed, copy, opts):
        content1 = None
        content2 = None
        fctx1 = None
        fctx2 = None
        flag1 = None
        flag2 = None
        if f1:
            fctx1 = getfilectx(f1, ctx1)
            if opts.git or losedatafn:
                flag1 = ctx1.flags(f1)
        if f2:
            fctx2 = getfilectx(f2, ctx2)
            if opts.git or losedatafn:
                flag2 = ctx2.flags(f2)
        # if binary is True, output "summary" or "base85", but not "text diff"
        if opts.text:
            binary = False
        else:
            binary = any(f.isbinary() for f in [fctx1, fctx2] if f is not None)

        if losedatafn and not opts.git:
            # plain diffs cannot represent these changes; ask the caller
            # whether losing the information is acceptable
            if (binary or
                # copy/rename
                f2 in copy or
                # empty file creation
                (not f1 and isempty(fctx2)) or
                # empty file deletion
                (isempty(fctx1) and not f2) or
                # create with flags
                (not f1 and flag2) or
                # change flags
                (f1 and f2 and flag1 != flag2)):
                losedatafn(f2 or f1)

        path1 = f1 or f2
        path2 = f2 or f1
        path1 = posixpath.join(prefix, path1[len(relroot):])
        path2 = posixpath.join(prefix, path2[len(relroot):])
        header = []
        if opts.git:
            header.append('diff --git %s%s %s%s' %
                          (aprefix, path1, bprefix, path2))
            if not f1: # added
                header.append('new file mode %s' % gitmode[flag2])
            elif not f2: # removed
                header.append('deleted file mode %s' % gitmode[flag1])
            else:  # modified/copied/renamed
                mode1, mode2 = gitmode[flag1], gitmode[flag2]
                if mode1 != mode2:
                    header.append('old mode %s' % mode1)
                    header.append('new mode %s' % mode2)
                if copyop is not None:
                    if opts.showsimilarity:
                        sim = similar.score(ctx1[path1], ctx2[path2]) * 100
                        header.append('similarity index %d%%' % sim)
                    header.append('%s from %s' % (copyop, path1))
                    header.append('%s to %s' % (copyop, path2))
        elif revs and not repo.ui.quiet:
            header.append(diffline(path1, revs))

        #  fctx.is  | diffopts                | what to   | is fctx.data()
        #  binary() | text nobinary git index | output?   | outputted?
        # ------------------------------------|----------------------------
        #  yes      | no   no       no  *     | summary   | no
        #  yes      | no   no       yes *     | base85    | yes
        #  yes      | no   yes      no  *     | summary   | no
        #  yes      | no   yes      yes 0     | summary   | no
        #  yes      | no   yes      yes >0    | summary   | semi [1]
        #  yes      | yes  *        *   *     | text diff | yes
        #  no       | *    *        *   *     | text diff | yes
        # [1]: hash(fctx.data()) is outputted. so fctx.data() cannot be faked
        if binary and (not opts.git or (opts.git and opts.nobinary and not
                                        opts.index)):
            # fast path: no binary content will be displayed, content1 and
            # content2 are only used for equivalent test. cmp() could have a
            # fast path.
            if fctx1 is not None:
                content1 = b'\0'
            if fctx2 is not None:
                if fctx1 is not None and not fctx1.cmp(fctx2):
                    content2 = b'\0' # not different
                else:
                    content2 = b'\0\0'
        else:
            # normal path: load contents
            if fctx1 is not None:
                content1 = fctx1.data()
            if fctx2 is not None:
                content2 = fctx2.data()

        if binary and opts.git and not opts.nobinary:
            text = mdiff.b85diff(content1, content2)
            if text:
                header.append('index %s..%s' %
                              (gitindex(content1), gitindex(content2)))
            hunks = (None, [text]),
        else:
            if opts.git and opts.index > 0:
                flag = flag1
                if flag is None:
                    flag = flag2
                header.append('index %s..%s %s' %
                              (gitindex(content1)[0:opts.index],
                               gitindex(content2)[0:opts.index],
                               gitmode[flag]))

            uheaders, hunks = mdiff.unidiff(content1, date1,
                                            content2, date2,
                                            path1, path2,
                                            binary=binary, opts=opts)
            header.extend(uheaders)
        yield fctx1, fctx2, header, hunks
2845
def diffstatsum(stats):
    """Aggregate (filename, adds, removes, isbinary) tuples into
    (maxfile, maxtotal, addtotal, removetotal, binary)."""
    maxfile = maxtotal = addtotal = removetotal = 0
    binary = False
    for filename, added, removed, isbinary in stats:
        maxfile = max(maxfile, encoding.colwidth(filename))
        maxtotal = max(maxtotal, added + removed)
        addtotal += added
        removetotal += removed
        binary = binary or isbinary

    return maxfile, maxtotal, addtotal, removetotal, binary
2856
def diffstatdata(lines):
    """Parse diff output into a list of (filename, adds, removes, isbinary)
    tuples, one per file diff.

    Header lines (between a 'diff' line and the first '@@' hunk) are not
    counted, so '---'/'+++' lines do not inflate the removal/add counts.
    """
    # raw string: '\s' in a non-raw literal is an invalid escape sequence
    # (an error in modern Python); the pattern itself is unchanged
    diffre = re.compile(r'^diff .*-r [a-z0-9]+\s(.*)$')

    results = []
    filename, adds, removes, isbinary = None, 0, 0, False

    def addresult():
        # flush counters for the file parsed so far, if any
        if filename:
            results.append((filename, adds, removes, isbinary))

    # inheader is used to track if a line is in the
    # header portion of the diff. This helps properly account
    # for lines that start with '--' or '++'
    inheader = False

    for line in lines:
        if line.startswith('diff'):
            addresult()
            # starting a new file diff
            # set numbers to 0 and reset inheader
            inheader = True
            adds, removes, isbinary = 0, 0, False
            if line.startswith('diff --git a/'):
                filename = gitre.search(line).group(2)
            elif line.startswith('diff -r'):
                # format: "diff -r ... -r ... filename"
                filename = diffre.search(line).group(1)
        elif line.startswith('@@'):
            inheader = False
        elif line.startswith('+') and not inheader:
            adds += 1
        elif line.startswith('-') and not inheader:
            removes += 1
        elif (line.startswith('GIT binary patch') or
              line.startswith('Binary file')):
            isbinary = True
    addresult()
    return results
2895
def diffstat(lines, width=80):
    """Render a classic diffstat table for the given diff lines, fitted
    to *width* columns."""
    stats = diffstatdata(lines)
    maxname, maxtotal, totaladds, totalremoves, hasbinary = diffstatsum(stats)

    countwidth = len(str(maxtotal))
    if hasbinary:
        # leave room for the 'Bin' marker
        countwidth = max(countwidth, 3)
    graphwidth = max(width - countwidth - maxname - 6, 10)

    def scale(i):
        if maxtotal <= graphwidth:
            return i
        # If diffstat runs out of room it doesn't print anything,
        # which isn't very useful, so always print at least one + or -
        # if there were at least some changes.
        return max(i * graphwidth // maxtotal, int(bool(i)))

    output = []
    for filename, adds, removes, isbinary in stats:
        count = 'Bin' if isbinary else '%d' % (adds + removes)
        pluses = '+' * scale(adds)
        minuses = '-' * scale(removes)
        padding = ' ' * (maxname - encoding.colwidth(filename))
        output.append(' %s%s | %*s %s%s\n'
                      % (filename, padding, countwidth, count,
                         pluses, minuses))

    if stats:
        output.append(_(' %d files changed, %d insertions(+), '
                        '%d deletions(-)\n')
                      % (len(stats), totaladds, totalremoves))

    return ''.join(output)
2933
def diffstatui(*args, **kw):
    '''like diffstat(), but yields 2-tuples of (output, label) for
    ui.write()
    '''

    for line in diffstat(*args, **kw).splitlines():
        if line and line[-1] in '+-':
            # split the graph column off so it can be colored
            name, graph = line.rsplit(' ', 1)
            yield (name + ' ', '')
            inserted = re.search(br'\++', graph)
            if inserted:
                yield (inserted.group(0), 'diffstat.inserted')
            deleted = re.search(br'-+', graph)
            if deleted:
                yield (deleted.group(0), 'diffstat.deleted')
        else:
            yield (line, '')
    yield ('\n', '')
General Comments 0
You need to be logged in to leave comments. Login now