upstream/mercurial-mirror Commit - r1644:e7e6504c

Remove duplicate bunidiff code from hgdiff, importing from mdiff.py instead

mason@suse.com -

r1644:e7e6504c default

parent child

contrib/hgdiff

0 +1 -121

              #!/usr/bin/env python
              import os, sys, struct, stat
              import difflib
              import re
              from optparse import OptionParser
              from mercurial.bdiff import bdiff, blocks
+             from mercurial.mdiff import bunidiff
              VERSION="0.2"
              usage = "usage: %prog [options] file1 file2"
              parser = OptionParser(usage=usage)
              parser.add_option("-d", "--difflib", action="store_true", default=False)
              parser.add_option('-x', '--count', default=1)
              parser.add_option('-c', '--context', type="int", default=3)
              parser.add_option('-p', '--show-c-function', action="store_true", default=False)
              parser.add_option('-w', '--ignore-all-space', action="store_true",
                                default=False)
              (options, args) = parser.parse_args()
              if not args:
                  parser.print_help()
                  sys.exit(1)
-             # somewhat self contained replacement for difflib.unified_diff
-             # t1 and t2 are the text to be diffed
-             # l1 and l2 are the text broken up into lines
-             # header1 and header2 are the filenames for the diff output
-             # context is the number of context lines
-             # showfunc enables diff -p output
-             # ignorews ignores all whitespace changes in the diff
-             def bunidiff(t1, t2, l1, l2, header1, header2, context=3, showfunc=False,
-                          ignorews=False):
-                 def contextend(l, len):
-                     ret = l + context
-                     if ret > len:
-                         ret = len
-                     return ret
-                 def contextstart(l):
-                     ret = l - context
-                     if ret < 0:
-                         return 0
-                     return ret
-                 def yieldhunk(hunk, header):
-                     if header:
-                         for x in header:
-                             yield x
-                     (astart, a2, bstart, b2, delta) = hunk
-                     aend = contextend(a2, len(l1))
-                     alen = aend - astart
-                     blen = b2 - bstart + aend - a2
-                     func = ""
-                     if showfunc:
-                         # walk backwards from the start of the context
-                         # to find a line starting with an alphanumeric char.
-                         for x in xrange(astart, -1, -1):
-                             t = l1[x]
-                             if funcre.match(t):
-                                 func = ' ' + t[:40]
-                                 break
-                     yield "@@ -%d,%d +%d,%d @@%s\n" % (astart + 1, alen,
-                                                        bstart + 1, blen, func)
-                     for x in delta:
-                         yield x
-                     for x in xrange(a2, aend):
-                         yield ' ' + l1[x]
-                 header = [ "--- %s\t\n" % header1, "+++ %s\t\n" % header2 ]
-                 if showfunc:
-                     funcre = re.compile('\w')
-                 if ignorews:
-                     wsre = re.compile('[ \t]')
-                 # bdiff.blocks gives us the matching sequences in the files.  The loop
-                 # below finds the spaces between those matching sequences and translates
-                 # them into diff output.
+                 #
-                 diff = blocks(t1, t2)
-                 hunk = None
-                 for i in xrange(len(diff)):
-                     # The first match is special.
-                     # we've either found a match starting at line 0 or a match later
-                     # in the file.  If it starts later, old and new below will both be
-                     # empty and we'll continue to the next match.
-                     if i > 0:
-                         s = diff[i-1]
-                     else:
-                         s = [0, 0, 0, 0]
-                     delta = []
-                     s1 = diff[i]
-                     a1 = s[1]
-                     a2 = s1[0]
-                     b1 = s[3]
-                     b2 = s1[2]
-                     old = l1[a1:a2]
-                     new = l2[b1:b2]
-                     # bdiff sometimes gives huge matches past eof, this check eats them,
-                     # and deals with the special first match case described above
-                     if not old and not new:
-                         continue
-                     if ignorews:
-                         wsold = wsre.sub('', "".join(old))
-                         wsnew = wsre.sub('', "".join(new))
-                         if wsold == wsnew:
-                             continue
-                     astart = contextstart(a1)
-                     bstart = contextstart(b1)
-                     prev = None
-                     if hunk:
-                         # join with the previous hunk if it falls inside the context
-                         if astart < hunk[1] + context + 1:
-                             prev = hunk
-                             astart = hunk[1]
-                             bstart = hunk[3]
-                         else:
-                             for x in yieldhunk(hunk, header):
-                                 yield x
-                             # we only want to yield the header if the files differ, and
-                             # we only want to yield it once.
-                             header = None
-                     if prev:
-                         # we've joined the previous hunk, record the new ending points.
-                         hunk[1] = a2
-                         hunk[3] = b2
-                         delta = hunk[4]
-                     else:
-                         # create a new hunk
-                         hunk = [ astart, a2, bstart, b2, delta ]
-                     delta[len(delta):] = [ ' ' + x for x in l1[astart:a1] ]
-                     delta[len(delta):] = [ '-' + x for x in old ]
-                     delta[len(delta):] = [ '+' + x for x in new ]
-                 if hunk:
-                     for x in yieldhunk(hunk, header):
-                         yield x
              # simple utility function to put all the
              # files from a directory tree into a dict
              def buildlist(names, top):
                  tlen = len(top)
                  for root, dirs, files in os.walk(top):
                      l = root[tlen + 1:]
                      for x in files:
                          p = os.path.join(root, x)
                          st = os.lstat(p)
                          if stat.S_ISREG(st.st_mode):
                              names[os.path.join(l, x)] = (st.st_dev, st.st_ino)
              def diff_files(file1, file2):
                  if file1 == None:
                      b = file(file2).read().splitlines(1)
                      l1 = "--- %s\n" % (file2)
                      l2 = "+++ %s\n" % (file2)
                      l3 = "@@ -0,0 +1,%d @@\n" % len(b)
                      l = [l1, l2, l3] + ["+" + e for e in b]
                  elif file2 == None:
                      a = file(file1).read().splitlines(1)
                      l1 = "--- %s\n" % (file1)
                      l2 = "+++ %s\n" % (file1)
                      l3 = "@@ -1,%d +0,0 @@\n" % len(a)
                      l = [l1, l2, l3] + ["-" + e for e in a]
                  else:
                      t1 = file(file1).read()
                      t2 = file(file2).read()
                      l1 = t1.splitlines(1)
                      l2 = t2.splitlines(1)
                      if options.difflib:
                          l = difflib.unified_diff(l1, l2, file1, file2)
                      else:
                          l = bunidiff(t1, t2, l1, l2, file1, file2, context=options.context,
                                   showfunc=options.show_c_function,
                                   ignorews=options.ignore_all_space)
                  for x in l:
                      if x[-1] != '\n':
                          x += "\n\ No newline at end of file\n"
                      print x,
              file1 = args[0]
              file2 = args[1]
              if os.path.isfile(file1) and os.path.isfile(file2):
                  diff_files(file1, file2)
              elif os.path.isdir(file1):
                  if not os.path.isdir(file2):
                      sys.stderr.write("file types don't match\n")
                      sys.exit(1)
                  d1 = {}
                  d2 = {}
                  buildlist(d1, file1)
                  buildlist(d2, file2)
                  keys = d1.keys()
                  keys.sort()
                  for x in keys:
                      if x not in d2:
                          f2 = None
                      else:
                          f2 = os.path.join(file2, x)
                          st1 = d1[x]
                          st2 = d2[x]
                          del d2[x]
                          if st1[0] == st2[0] and st1[1] == st2[1]:
                              sys.stderr.write("%s is a hard link\n" % x)
                              continue
                      x = os.path.join(file1, x)
                      diff_files(x, f2)
                  keys = d2.keys()
                  keys.sort()
                  for x in keys:
                      f1 = None
                      x = os.path.join(file2, x)
                      diff_files(f1, x)

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages