##// END OF EJS Templates
mdiff: reinstate new algorithm...
mpm@selenic.com -
r325:ad87e198 default
parent child Browse files
Show More
@@ -1,99 +1,115 b''
1 1 # mdiff.py - diff and patch routines for mercurial
2 2 #
3 3 # Copyright 2005 Matt Mackall <mpm@selenic.com>
4 4 #
5 5 # This software may be used and distributed according to the terms
6 6 # of the GNU General Public License, incorporated herein by reference.
7 7
8 8 import difflib, struct
9 9 from mercurial.mpatch import *
10 10
11 11 def unidiff(a, ad, b, bd, fn):
12 12 if not a and not b: return ""
13 13
14 14 if a == None:
15 15 b = b.splitlines(1)
16 16 l1 = "--- %s\t%s\n" % ("/dev/null", ad)
17 17 l2 = "+++ %s\t%s\n" % ("b/" + fn, bd)
18 18 l3 = "@@ -0,0 +1,%d @@\n" % len(b)
19 19 l = [l1, l2, l3] + ["+" + e for e in b]
20 20 elif b == None:
21 21 a = a.splitlines(1)
22 22 l1 = "--- %s\t%s\n" % ("a/" + fn, ad)
23 23 l2 = "+++ %s\t%s\n" % ("/dev/null", bd)
24 24 l3 = "@@ -1,%d +0,0 @@\n" % len(a)
25 25 l = [l1, l2, l3] + ["-" + e for e in a]
26 26 else:
27 27 a = a.splitlines(1)
28 28 b = b.splitlines(1)
29 29 l = list(difflib.unified_diff(a, b, "a/" + fn, "b/" + fn))
30 30 if not l: return ""
31 31 # difflib uses a space, rather than a tab
32 32 l[0] = l[0][:-2] + "\t" + ad + "\n"
33 33 l[1] = l[1][:-2] + "\t" + bd + "\n"
34 34
35 35 for ln in xrange(len(l)):
36 36 if l[ln][-1] != '\n':
37 37 l[ln] += "\n\ No newline at end of file\n"
38 38
39 39 return "".join(l)
40 40
41 41 def textdiff(a, b):
42 42 return diff(a.splitlines(1), b.splitlines(1))
43 43
44 44 def sortdiff(a, b):
45 45 la = lb = 0
46 lena = len(a)
47 lenb = len(b)
46 48
47 49 while 1:
48 if la >= len(a) or lb >= len(b): break
49 if b[lb] < a[la]:
50 si = lb
51 while lb < len(b) and b[lb] < a[la] : lb += 1
52 yield "insert", la, la, si, lb
53 elif a[la] < b[lb]:
54 si = la
55 while la < len(a) and a[la] < b[lb]: la += 1
56 yield "delete", si, la, lb, lb
57 else:
50 am, bm, = la, lb
51
52 # walk over matching lines
53 while lb < lenb and la < lenb and a[la] == b[lb] :
58 54 la += 1
59 55 lb += 1
60 56
61 if lb < len(b):
62 yield "insert", la, la, lb, len(b)
57 if la > am:
58 yield (am, bm, la - am) # return a match
59
60 # skip mismatched lines from b
61 while lb < lenb and b[lb] < a[la]:
62 lb += 1
63 63
64 if la < len(a):
65 yield "delete", la, len(a), lb, lb
64 if lb >= lenb:
65 break
66
67 # skip mismatched lines from a
68 while la < lena and b[lb] > a[la]:
69 la += 1
70
71 if la >= lena:
72 break
73
74 yield (lena, lenb, 0)
66 75
67 76 def diff(a, b, sorted=0):
77 if not a:
78 s = "".join(b)
79 return s and (struct.pack(">lll", 0, 0, len(s)) + s)
80
68 81 bin = []
69 82 p = [0]
70 83 for i in a: p.append(p[-1] + len(i))
71 84
72 85 if sorted:
73 86 try:
74 87 d = sortdiff(a, b)
75 88 except:
76 89 print a, b
77 90 raise
78 91 else:
79 d = difflib.SequenceMatcher(None, a, b).get_opcodes()
80
81 for o, m, n, s, t in d:
82 if o == 'equal': continue
83 s = "".join(b[s:t])
84 bin.append(struct.pack(">lll", p[m], p[n], len(s)) + s)
92 d = difflib.SequenceMatcher(None, a, b).get_matching_blocks()
93 la = 0
94 lb = 0
95 for am, bm, size in d:
96 s = "".join(b[lb:bm])
97 if am > la or s:
98 bin.append(struct.pack(">lll", p[la], p[am], len(s)) + s)
99 la = am + size
100 lb = bm + size
85 101
86 102 return "".join(bin)
87 103
88 104 def patchtext(bin):
89 105 pos = 0
90 106 t = []
91 107 while pos < len(bin):
92 108 p1, p2, l = struct.unpack(">lll", bin[pos:pos + 12])
93 109 pos += 12
94 110 t.append(bin[pos:pos + l])
95 111 pos += l
96 112 return "".join(t)
97 113
98 114 def patch(a, bin):
99 115 return patches(a, [bin])
General Comments 0
You need to be logged in to leave comments. Login now