upstream/mercurial-mirror Commit - r7699:fac054f8

pure Python implementation of mpatch.c

Martin Geisler -

r7699:fac054f8 default

parent child

mercurial/pure/mpatch.py

0 created 644 +103 0

			@@ -0,0 +1,103 b''
		1	# mpatch.py - Python implementation of mpatch.c
		2	#
		3	# Copyright 2009 Matt Mackall <mpm@selenic.com> and others
		4	#
		5	# This software may be used and distributed according to the terms
		6	# of the GNU General Public License, incorporated herein by reference.
		7
		8	import struct, mmap
		9
		# Handle on /dev/zero, opened once at import time and kept as a module
		# attribute.  The builtin open() is used instead of file(), which only
		# exists on Python 2; binary mode because the device yields raw bytes.
		devzero = open("/dev/zero", "rb")
		11
		12	# This attempts to apply a series of patches in time proportional to
		13	# the total size of the patches, rather than patches * len(text). This
		14	# means rather than shuffling strings around, we shuffle around
		15	# pointers to fragments with fragment lists.
		16	#
		17	# When the fragment lists get too long, we collapse them. To do this
		18	# efficiently, we do all our operations inside a buffer created by
		19	# mmap and simply use memmove. This avoids creating a bunch of large
		20	# temporary string buffers.
		21
		def patches(a, bins):
		    """Apply a sequence of binary patches to a text and return the result.

		    Each patch is a concatenation of hunks.  A hunk is a 12-byte header of
		    three big-endian signed 32-bit integers ``(start, end, length)``
		    followed by ``length`` bytes of data that replace ``text[start:end]``.
		    Offsets in a patch refer to the text produced by the previous patch.

		    The work is done on lists of ``(length, offset)`` fragments pointing
		    into one scratch buffer, so the cost is proportional to the total size
		    of the patches rather than patches * len(text).  The buffer holds two
		    working text areas plus a copy of every patch; when the fragment list
		    grows past 128 entries it is flattened into the idle text area.

		    Args:
		        a: the original text (a byte string).
		        bins: sequence of binary patches, applied in order.

		    Returns:
		        The patched text.  ``a`` itself is returned when there is nothing
		        to apply.

		    Raises:
		        ValueError: a hunk header is truncated, has a negative length, runs
		            past the end of its patch, or is out of order or overlapping.
		        IndexError: a hunk refers to bytes beyond the end of the text.
		    """
		    from collections import deque

		    if not bins:
		        return a

		    plens = [len(x) for x in bins]
		    pl = sum(plens)
		    bl = len(a) + pl
		    tl = bl + bl + pl  # enough for the patches and two working texts
		    b1, b2 = 0, bl

		    if not tl:
		        return a

		    # An anonymous mapping provides zero-filled scratch memory without
		    # needing a /dev/zero device or any module-level file handle.
		    m = mmap.mmap(-1, tl)
		    try:
		        # load our original text
		        m.write(a)
		        frags = deque([(len(a), b1)])

		        # copy all the patches into our segment so we can memmove from them
		        pos = b2 + bl
		        m.seek(pos)
		        for p in bins:
		            m.write(p)

		        def pull(dst, src, l):
		            """Move fragments covering the next l bytes from src to dst."""
		            while l:
		                f = src.popleft()
		                if f[0] > l:  # do we need to split?
		                    src.appendleft((f[0] - l, f[1] + l))
		                    dst.append((l, f[1]))
		                    return
		                dst.append(f)
		                l -= f[0]

		        def collect(buf, fragments):
		            """Copy fragments back to back at offset buf; return (length, buf)."""
		            start = buf
		            for l, p in fragments:
		                m.move(buf, p, l)
		                buf += l
		            return (buf - start, start)

		        for plen in plens:
		            # if our list gets too long, execute it
		            if len(frags) > 128:
		                b2, b1 = b1, b2
		                frags = deque([collect(b1, frags)])

		            new = []
		            end = pos + plen
		            last = 0
		            while pos < end:
		                if pos + 12 > end:  # not enough bytes left for a header
		                    raise ValueError("patch cannot be decoded")
		                p1, p2, l = struct.unpack(">lll", m[pos:pos + 12])
		                # Reject hunks that would otherwise yield negative-length
		                # fragments or read data belonging to the next patch.
		                if p1 < last or p2 < p1 or l < 0 or pos + 12 + l > end:
		                    raise ValueError("patch cannot be decoded")
		                pull(new, frags, p1 - last)  # what didn't change
		                pull([], frags, p2 - p1)  # what got deleted
		                new.append((l, pos + 12))  # what got added
		                pos += l + 12
		                last = p2
		            new.extend(frags)  # what was left at the end
		            frags = deque(new)

		        t = collect(b2, frags)

		        # slicing copies the result out, so the mapping can be released
		        return m[t[1]:t[1] + t[0]]
		    finally:
		        m.close()
		82
		def patchedsize(orig, delta):
		    """Return the size of the text produced by applying ``delta``.

		    ``delta`` is a sequence of hunks: a 12-byte header of three big-endian
		    signed 32-bit integers ``(start, end, length)`` followed by ``length``
		    bytes of replacement data for ``text[start:end]``.

		    Args:
		        orig: length of the text the delta applies to.
		        delta: the binary delta.

		    Returns:
		        The length of the patched text.

		    Raises:
		        ValueError: the delta is truncated, has trailing bytes, or contains
		            a hunk with start > end or a negative length.
		    """
		    outlen, last, hunk = 0, 0, 0
		    binend = len(delta)
		    data = 12  # offset of the current hunk's payload

		    while data <= binend:
		        start, end, length = struct.unpack(">lll", delta[hunk:hunk + 12])
		        # A negative length would move the cursor backwards (or, for -12,
		        # leave it in place forever), so reject it along with start > end.
		        if start > end or length < 0:
		            break
		        hunk = data + length
		        data = hunk + 12
		        outlen += start - last
		        last = end
		        outlen += length

		    # The cursor must land exactly on the end of the delta; anything else
		    # means a bad hunk, a truncated payload or trailing bytes.
		    if hunk != binend:
		        raise ValueError("patch cannot be decoded")

		    outlen += orig - last
		    return outlen

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages