upstream/mercurial-mirror Files · mercurial/mdiff.py

Fix revlog-ng interaction with old-http....

Fix revlog-ng interaction with old-http. revlog.py wasn't trying to detect the version of a revlog file that doesn't exist on the filesystem (as is the case with old-http). Additionally, there was an off-by-one error in httprangereader.read (ranges in HTTP Range headers are inclusive), making it get more data than what was asked for. This made a struct.unpack complain that "unpack str size does not match format". Finally, with the two fixes above, test-static-http fails, since BaseHTTPServer doesn't understand ranges and returns too much data. Work around that by reading only the specified amount.

mason@suse.com - - Load All Authors

File last commit:

r2078:441ea218 default


                r2138:f5046cab

default

Download file

             mdiff.py
        
                    196 lines
            
             | 6.0 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / mercurial / mdiff.py
          
                    History
                
                 |
                  Source
                 | Raw
                 |Copy content
                 |Copy permalink

        mpm@selenic.com
    
mdiff.py: kill #! line, add copyright notice...

              r239
            
      # mdiff.py - diff and patch routines for mercurial

      #

      # Copyright 2005 Matt Mackall <mpm@selenic.com>

      #

      # This software may be used and distributed according to the terms

      # of the GNU General Public License, incorporated herein by reference.

        mason@suse.com
    
Add new bdiff based unidiff generation.

              r1637
            
      from demandload import demandload

      import struct, bdiff, util, mpatch

      demandload(globals(), "re")

        mpm@selenic.com
    
Add back links from file revisions to changeset revisions...

              r0
            
        mason@suse.com
    
Add new bdiff based unidiff generation.

              r1637
            
      def unidiff(a, ad, b, bd, fn, r=None, text=False,
                  showfunc=False, ignorews=False):
          """Return a unified diff between texts a and b as one string.

          a, b      -- old and new file contents; a falsy value means "empty",
                       and None additionally makes the corresponding header
                       name /dev/null with the epoch date
          ad, bd    -- date strings placed after the tab in the ---/+++ headers
          fn        -- file name, shown as a/<fn> and b/<fn>
          r         -- optional sequence of revisions; when non-empty a leading
                       "diff -r REV ... <fn>" line is emitted
          text      -- when true, skip the util.binary() check
          showfunc, ignorews -- passed through to bunidiff()

          Returns "" when both texts are empty or when bunidiff() yields
          nothing.
          """
          # nothing to compare
          if not a and not b:
              return ""
          epoch = util.datestr((0, 0))

          if not text and (util.binary(a) or util.binary(b)):
              lines = ['Binary file %s has changed\n' % fn]
          elif not a:
              # old side is empty or missing: every line of b is an addition
              added = b.splitlines(True)
              if a is None:
                  oldhdr = "--- %s\t%s\n" % ("/dev/null", epoch)
              else:
                  oldhdr = "--- %s\t%s\n" % ("a/" + fn, ad)
              newhdr = "+++ %s\t%s\n" % ("b/" + fn, bd)
              hunkhdr = "@@ -0,0 +1,%d @@\n" % len(added)
              lines = [oldhdr, newhdr, hunkhdr] + ["+" + e for e in added]
          elif not b:
              # new side is empty or missing: every line of a is a removal
              removed = a.splitlines(True)
              oldhdr = "--- %s\t%s\n" % ("a/" + fn, ad)
              if b is None:
                  newhdr = "+++ %s\t%s\n" % ("/dev/null", epoch)
              else:
                  newhdr = "+++ %s\t%s\n" % ("b/" + fn, bd)
              hunkhdr = "@@ -1,%d +0,0 @@\n" % len(removed)
              lines = [oldhdr, newhdr, hunkhdr] + ["-" + e for e in removed]
          else:
              al = a.splitlines(True)
              bl = b.splitlines(True)
              lines = list(bunidiff(a, b, al, bl, "a/" + fn, "b/" + fn,
                                    showfunc=showfunc, ignorews=ignorews))
              if not lines:
                  return ""
              # difflib uses a space, rather than a tab
              # bunidiff's headers end in "\t\n"; strip that and append the date
              lines[0] = "%s\t%s\n" % (lines[0][:-2], ad)
              lines[1] = "%s\t%s\n" % (lines[1][:-2], bd)

          # a line without a trailing newline gets the conventional marker
          marker = "\n\\ No newline at end of file\n"
          for idx, line in enumerate(lines):
              if line[-1] != '\n':
                  lines[idx] = line + marker

          if r:
              revs = ' '.join(["-r %s" % rev for rev in r])
              lines.insert(0, "diff %s %s\n" % (revs, fn))

          return "".join(lines)

        mason@suse.com
    
Add new bdiff based unidiff generation.

              r1637
            
      # somewhat self contained replacement for difflib.unified_diff

      # t1 and t2 are the text to be diffed

      # l1 and l2 are the text broken up into lines

      # header1 and header2 are the filenames for the diff output

      # context is the number of context lines

      # showfunc enables diff -p output

      # ignorews ignores all whitespace changes in the diff

      def bunidiff(t1, t2, l1, l2, header1, header2, context=3, showfunc=False,
                   ignorews=False):
          """Generate the lines of a unified diff between two texts.

          t1, t2           -- the texts to be diffed (handed to bdiff.blocks)
          l1, l2           -- the same texts broken up into lines
          header1, header2 -- file names for the "---" and "+++" header lines
          context          -- number of context lines around each change
          showfunc         -- append to each "@@" line the nearest preceding
                              line of l1 that starts with a word character
          ignorews         -- skip changes that differ only in spaces/tabs

          This is a generator.  The two header lines are yielded once, just
          before the first hunk; nothing at all is yielded when no hunk is
          produced.
          """
          def contextend(l, limit):
              # end of the trailing context, clamped to the number of lines
              return min(l + context, limit)

          def contextstart(l):
              # start of the leading context, clamped to the first line
              return max(l - context, 0)

          def yieldhunk(hunk, header):
              if header:
                  for x in header:
                      yield x
              (astart, a2, bstart, b2, delta) = hunk
              aend = contextend(a2, len(l1))
              alen = aend - astart
              blen = b2 - bstart + aend - a2

              func = ""
              if showfunc:
                  # walk backwards from the start of the context
                  # to find a line starting with an alphanumeric char.
                  # astart may equal len(l1) (empty l1, or context=0 with a
                  # change at end of file), so clamp to the last valid index.
                  for x in xrange(min(astart, len(l1) - 1), -1, -1):
                      t = l1[x].rstrip()
                      if funcre.match(t):
                          func = ' ' + t[:40]
                          break

              yield "@@ -%d,%d +%d,%d @@%s\n" % (astart + 1, alen,
                                                 bstart + 1, blen, func)
              for x in delta:
                  yield x
              # trailing context after the last change of the hunk
              for x in xrange(a2, aend):
                  yield ' ' + l1[x]

          header = [ "--- %s\t\n" % header1, "+++ %s\t\n" % header2 ]

          if showfunc:
              funcre = re.compile(r'\w')
          if ignorews:
              wsre = re.compile('[ \t]')

          # bdiff.blocks gives us the matching sequences in the files.  The loop
          # below finds the spaces between those matching sequences and translates
          # them into diff output.
          #
          diff = bdiff.blocks(t1, t2)
          hunk = None
          for i, s1 in enumerate(diff):
              # The first match is special.
              # we've either found a match starting at line 0 or a match later
              # in the file.  If it starts later, old and new below will both be
              # empty and we'll continue to the next match.
              if i > 0:
                  s = diff[i - 1]
              else:
                  s = [0, 0, 0, 0]
              # the gap runs from the end of the previous match (s[1], s[3])
              # to the start of the current one (s1[0], s1[2])
              a1 = s[1]
              a2 = s1[0]
              b1 = s[3]
              b2 = s1[2]

              old = l1[a1:a2]
              new = l2[b1:b2]

              # bdiff sometimes gives huge matches past eof, this check eats them,
              # and deals with the special first match case described above
              if not old and not new:
                  continue

              if ignorews:
                  wsold = wsre.sub('', "".join(old))
                  wsnew = wsre.sub('', "".join(new))
                  if wsold == wsnew:
                      continue

              astart = contextstart(a1)
              bstart = contextstart(b1)
              if hunk and astart < hunk[1] + context + 1:
                  # this change falls inside the previous hunk's context:
                  # join it, recording the new ending points.  Context for
                  # this change resumes where the previous change ended.
                  astart = hunk[1]
                  hunk[1] = a2
                  hunk[3] = b2
                  delta = hunk[4]
              else:
                  if hunk:
                      for x in yieldhunk(hunk, header):
                          yield x
                      # we only want to yield the header if the files differ,
                      # and we only want to yield it once.
                      header = None
                  # create a new hunk
                  delta = []
                  hunk = [ astart, a2, bstart, b2, delta ]

              delta.extend([ ' ' + x for x in l1[astart:a1] ])
              delta.extend([ '-' + x for x in old ])
              delta.extend([ '+' + x for x in new ])

          if hunk:
              for x in yieldhunk(hunk, header):
                  yield x

        mpm@selenic.com
    
Add a function to return the new text from a binary diff

              r120
            
      def patchtext(bin):
          """Return the concatenated payloads carried by a binary patch.

          bin is read as a sequence of fragments.  Each fragment is a 12-byte
          header of three big-endian signed 32-bit integers, followed by a
          payload whose length is the third integer.  The first two integers
          are not used here.

          The result has the same string type as bin (an empty slice of bin
          is used as the joiner), so byte strings work as well as plain str.
          Raises struct.error if a header is truncated.
          """
          pos = 0
          t = []
          while pos < len(bin):
              # only the payload length matters for extracting the new text
              l = struct.unpack(">lll", bin[pos:pos + 12])[2]
              pos += 12
              t.append(bin[pos:pos + l])
              pos += l
          return bin[:0].join(t)

        mpm@selenic.com
    
Add back links from file revisions to changeset revisions...

              r0
            
      def patch(a, bin):
          """Apply the single binary delta bin to a via mpatch.patches()."""
          # mpatch.patches() takes a list of deltas; wrap the one we have
          deltas = [bin]
          return mpatch.patches(a, deltas)

        mpm@selenic.com
    
Start using bdiff for generating deltas...

              r432
            
        Matt Mackall
    
Clean up mdiff imports

              r1379
            
      # expose mpatch.patches under this module's namespace
      patches = mpatch.patches

        mason@suse.com
    
Fill in the uncompressed size during revlog.addgroup...

              r2078
            
      # expose mpatch.patchedsize under this module's namespace
      patchedsize = mpatch.patchedsize

        mpm@selenic.com
    
Start using bdiff for generating deltas...

              r432
            
      # textdiff is an alias for bdiff.bdiff
      textdiff = bdiff.bdiff

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

mpm@selenic.com mdiff.py: kill #! line, add copyright notice...	r239	# mdiff.py - diff and patch routines for mercurial
		#
		# Copyright 2005 Matt Mackall <mpm@selenic.com>
		#
		# This software may be used and distributed according to the terms
		# of the GNU General Public License, incorporated herein by reference.

mason@suse.com Add new bdiff based unidiff generation.	r1637	from demandload import demandload
		import struct, bdiff, util, mpatch
		demandload(globals(), "re")
mpm@selenic.com Add back links from file revisions to changeset revisions...	r0
mason@suse.com Add new bdiff based unidiff generation.	r1637
		def unidiff(a, ad, b, bd, fn, r=None, text=False,
		showfunc=False, ignorews=False):
Thomas Arendsen Hein Show revisions in diffs like CVS, based on a patch from Goffredo Baroncelli....	r396
mpm@selenic.com unidiff: punt on comparing empty files	r35	if not a and not b: return ""
Matt Mackall Clean up mdiff imports	r1379	epoch = util.datestr((0, 0))
mpm@selenic.com Attempt to make diff deal with null sources properly...	r264
Matt Mackall Clean up mdiff imports	r1379	if not text and (util.binary(a) or util.binary(b)):
mpm@selenic.com Add automatic binary file detection to diff and export...	r1015	l = ['Binary file %s has changed\n' % fn]
Thomas Arendsen Hein Fix diff against an empty file (issue124) and add a test for this.	r1723	elif not a:
mpm@selenic.com Attempt to make diff deal with null sources properly...	r264	b = b.splitlines(1)
Thomas Arendsen Hein Fix diff against an empty file (issue124) and add a test for this.	r1723	if a is None:
		l1 = "--- %s\t%s\n" % ("/dev/null", epoch)
		else:
		l1 = "--- %s\t%s\n" % ("a/" + fn, ad)
mpm@selenic.com Attempt to make diff deal with null sources properly...	r264	l2 = "+++ %s\t%s\n" % ("b/" + fn, bd)
		l3 = "@@ -0,0 +1,%d @@\n" % len(b)
		l = [l1, l2, l3] + ["+" + e for e in b]
Thomas Arendsen Hein Fix diff against an empty file (issue124) and add a test for this.	r1723	elif not b:
mpm@selenic.com Attempt to make diff deal with null sources properly...	r264	a = a.splitlines(1)
		l1 = "--- %s\t%s\n" % ("a/" + fn, ad)
Thomas Arendsen Hein Fix diff against an empty file (issue124) and add a test for this.	r1723	if b is None:
		l2 = "+++ %s\t%s\n" % ("/dev/null", epoch)
		else:
		l2 = "+++ %s\t%s\n" % ("b/" + fn, bd)
mpm@selenic.com Attempt to make diff deal with null sources properly...	r264	l3 = "@@ -1,%d +0,0 @@\n" % len(a)
		l = [l1, l2, l3] + ["-" + e for e in a]
		else:
mason@suse.com Add new bdiff based unidiff generation.	r1637	al = a.splitlines(1)
		bl = b.splitlines(1)
		l = list(bunidiff(a, b, al, bl, "a/" + fn, "b/" + fn,
		showfunc=showfunc, ignorews=ignorews))
mpm@selenic.com unidiff: handle empty diffs more gracefully...	r278	if not l: return ""
mpm@selenic.com diff: use tab to separate date from filename...	r272	# difflib uses a space, rather than a tab
twaldmann@thinkmo.de minor optimization: save some string trash	r1540	l[0] = "%s\t%s\n" % (l[0][:-2], ad)
		l[1] = "%s\t%s\n" % (l[1][:-2], bd)
mpm@selenic.com hg diff: fix missing final newline bug	r170
		for ln in xrange(len(l)):
		if l[ln][-1] != '\n':
		l[ln] += "\n\ No newline at end of file\n"

Thomas Arendsen Hein Show revisions in diffs like CVS, based on a patch from Goffredo Baroncelli....	r396	if r:
		l.insert(0, "diff %s %s\n" %
		(' '.join(["-r %s" % rev for rev in r]), fn))

mpm@selenic.com Add back links from file revisions to changeset revisions...	r0	return "".join(l)

mason@suse.com Add new bdiff based unidiff generation.	r1637	# somewhat self contained replacement for difflib.unified_diff
		# t1 and t2 are the text to be diffed
		# l1 and l2 are the text broken up into lines
		# header1 and header2 are the filenames for the diff output
		# context is the number of context lines
		# showfunc enables diff -p output
		# ignorews ignores all whitespace changes in the diff
		def bunidiff(t1, t2, l1, l2, header1, header2, context=3, showfunc=False,
		ignorews=False):
		def contextend(l, len):
		ret = l + context
		if ret > len:
		ret = len
		return ret

		def contextstart(l):
		ret = l - context
		if ret < 0:
		return 0
		return ret

		def yieldhunk(hunk, header):
		if header:
		for x in header:
		yield x
		(astart, a2, bstart, b2, delta) = hunk
		aend = contextend(a2, len(l1))
		alen = aend - astart
		blen = b2 - bstart + aend - a2

		func = ""
		if showfunc:
		# walk backwards from the start of the context
		# to find a line starting with an alphanumeric char.
		for x in xrange(astart, -1, -1):
		t = l1[x].rstrip()
		if funcre.match(t):
		func = ' ' + t[:40]
		break

		yield "@@ -%d,%d +%d,%d @@%s\n" % (astart + 1, alen,
		bstart + 1, blen, func)
		for x in delta:
		yield x
		for x in xrange(a2, aend):
		yield ' ' + l1[x]

		header = [ "--- %s\t\n" % header1, "+++ %s\t\n" % header2 ]

		if showfunc:
		funcre = re.compile('\w')
		if ignorews:
		wsre = re.compile('[ \t]')

		# bdiff.blocks gives us the matching sequences in the files. The loop
		# below finds the spaces between those matching sequences and translates
		# them into diff output.
		#
		diff = bdiff.blocks(t1, t2)
		hunk = None
		for i in xrange(len(diff)):
		# The first match is special.
		# we've either found a match starting at line 0 or a match later
		# in the file. If it starts later, old and new below will both be
		# empty and we'll continue to the next match.
		if i > 0:
		s = diff[i-1]
		else:
		s = [0, 0, 0, 0]
		delta = []
		s1 = diff[i]
		a1 = s[1]
		a2 = s1[0]
		b1 = s[3]
		b2 = s1[2]

		old = l1[a1:a2]
		new = l2[b1:b2]

		# bdiff sometimes gives huge matches past eof, this check eats them,
		# and deals with the special first match case described above
		if not old and not new:
		continue

		if ignorews:
		wsold = wsre.sub('', "".join(old))
		wsnew = wsre.sub('', "".join(new))
		if wsold == wsnew:
		continue

		astart = contextstart(a1)
		bstart = contextstart(b1)
		prev = None
		if hunk:
		# join with the previous hunk if it falls inside the context
		if astart < hunk[1] + context + 1:
		prev = hunk
		astart = hunk[1]
		bstart = hunk[3]
		else:
		for x in yieldhunk(hunk, header):
		yield x
		# we only want to yield the header if the files differ, and
		# we only want to yield it once.
		header = None
		if prev:
		# we've joined the previous hunk, record the new ending points.
		hunk[1] = a2
		hunk[3] = b2
		delta = hunk[4]
		else:
		# create a new hunk
		hunk = [ astart, a2, bstart, b2, delta ]

		delta[len(delta):] = [ ' ' + x for x in l1[astart:a1] ]
		delta[len(delta):] = [ '-' + x for x in old ]
		delta[len(delta):] = [ '+' + x for x in new ]

		if hunk:
		for x in yieldhunk(hunk, header):
		yield x

mpm@selenic.com Add a function to return the new text from a binary diff	r120	def patchtext(bin):
		pos = 0
		t = []
		while pos < len(bin):
		p1, p2, l = struct.unpack(">lll", bin[pos:pos + 12])
		pos += 12
		t.append(bin[pos:pos + l])
		pos += l
		return "".join(t)

mpm@selenic.com Add back links from file revisions to changeset revisions...	r0	def patch(a, bin):
Matt Mackall Clean up mdiff imports	r1379	return mpatch.patches(a, [bin])
mpm@selenic.com Start using bdiff for generating deltas...	r432
Matt Mackall Clean up mdiff imports	r1379	patches = mpatch.patches
mason@suse.com Fill in the uncompressed size during revlog.addgroup...	r2078	patchedsize = mpatch.patchedsize
mpm@selenic.com Start using bdiff for generating deltas...	r432	textdiff = bdiff.bdiff