bundlerepo.py
254 lines
| 9.2 KiB
| text/x-python
|
PythonLexer
/ mercurial / bundlerepo.py
Benoit Boissinot
|
"""
bundlerepo.py - repository class for viewing uncompressed bundles

This provides a read-only repository interface to bundles as if
they were part of the actual repository.

Copyright 2006, 2007 Benoit Boissinot <bboissin@gmail.com>

This software may be used and distributed according to the terms
of the GNU General Public License, incorporated herein by reference.
"""
from node import * | ||||
Matt Mackall
|
r3891 | from i18n import _ | ||
Matt Mackall
|
r3877 | import changegroup, util, os, struct, bz2, tempfile | ||
Benoit Boissinot
|
r1942 | |||
Benoit Boissinot
|
r1946 | import localrepo, changelog, manifest, filelog, revlog | ||
Benoit Boissinot
|
r1942 | |||
Benoit Boissinot
|
class bundlerevlog(revlog.revlog):
    """Read-only revlog that overlays the revisions found in a bundle.

    Revisions that are not recorded in ``self.basemap`` are served by
    revlog.revlog; revisions that come from the bundle are read straight
    from ``bundlefile`` as deltas against the node stored in
    ``self.basemap``.
    """

    def __init__(self, opener, indexfile, bundlefile,
                 linkmapper=None):
        """Index every chunk that changegroup.chunkiter yields from bundlefile.

        opener, indexfile -- passed unchanged to revlog.revlog.__init__
        bundlefile        -- opened bundle file; it is kept and later used
                             by chunk() to read deltas
        linkmapper        -- optional callable applied to the fourth
                             20 byte header field (cs) to get the link
                             value; when None the new revision number
                             is used as link

        Raises util.Abort when a chunk is shorter than the 80 byte header
        and revlog.LookupError when a parent of a new node is unknown.
        """
        # How it works:
        # to retrieve a revision, we need to know the offset of
        # the revision in the bundlefile (an opened file).
        #
        # We store this offset in the index (start). To differentiate
        # a rev in the bundle from a rev in the revlog, every bundle rev
        # is recorded in self.basemap, which maps the rev to the node
        # its delta applies to (see bundle() and bundlebase()).
        #
        revlog.revlog.__init__(self, opener, indexfile)
        self.bundlefile = bundlefile
        self.basemap = {}

        def chunkpositer():
            # Yield (chunk, offset) pairs; the offset is the file position
            # after the chunk minus the chunk length.
            # NOTE(review): assumes chunkiter leaves the file positioned
            # right after the chunk it just returned -- confirm.
            for chunk in changegroup.chunkiter(bundlefile):
                pos = bundlefile.tell()
                yield chunk, pos - len(chunk)

        n = self.count()
        prev = None
        for chunk, start in chunkpositer():
            size = len(chunk)
            if size < 80:
                raise util.Abort(_("invalid changegroup"))
            # skip the 80 byte header: start/size describe the delta only
            start += 80
            size -= 80
            node, p1, p2, cs = struct.unpack("20s20s20s20s", chunk[:80])
            if node in self.nodemap:
                # already known: nothing to index, but later chunks are
                # still recorded as deltas against this node
                prev = node
                continue
            for p in (p1, p2):
                if p not in self.nodemap:
                    # report the parent that is actually missing
                    raise revlog.LookupError(_("unknown parent %s")
                                             % short(p))
            if linkmapper is None:
                link = n
            else:
                link = linkmapper(cs)

            if not prev:
                # first chunk seen: its delta base is its first parent
                prev = p1
            # start, size, base is not used, link, p1, p2, delta ref
            if self.version == revlog.REVLOGV0:
                e = (start, size, None, link, p1, p2, node)
            else:
                e = (self.offset_type(start, 0), size, -1, None, link,
                     self.rev(p1), self.rev(p2), node)
            self.basemap[n] = prev
            self.index.append(e)
            self.nodemap[node] = n
            prev = node
            n += 1

    def bundle(self, rev):
        """is rev from the bundle"""
        if rev < 0:
            return False
        return rev in self.basemap

    def bundlebase(self, rev):
        """return the node the bundle delta of rev applies to

        Raises KeyError when rev was not recorded from the bundle.
        """
        return self.basemap[rev]

    def chunk(self, rev, df=None, cachelen=4096):
        """return the raw data stored for rev

        For a rev from the bundle this is read from the bundle file at
        the offset/length stored in the index; any other rev is delegated
        to revlog.revlog.chunk together with df and cachelen.
        """
        # Warning: in case of bundle, the diff is against bundlebase,
        # not against rev - 1
        # XXX: could use some caching
        if not self.bundle(rev):
            return revlog.revlog.chunk(self, rev, df, cachelen)
        self.bundlefile.seek(self.start(rev))
        return self.bundlefile.read(self.length(rev))

    def revdiff(self, rev1, rev2):
        """return or calculate a delta between two revisions"""
        if self.bundle(rev1) and self.bundle(rev2):
            # hot path for bundle: the stored delta of rev2 can be returned
            # as is when it was made against rev1
            revb = self.rev(self.bundlebase(rev2))
            if revb == rev1:
                return self.chunk(rev2)
        elif not self.bundle(rev1) and not self.bundle(rev2):
            return revlog.revlog.revdiff(self, rev1, rev2)

        # mixed case, or bundle revs not directly chained: diff full texts
        return self.diff(self.revision(self.node(rev1)),
                         self.revision(self.node(rev2)))

    def revision(self, node):
        """return the uncompressed text of the revision identified by node

        Returns "" for nullid. Raises revlog.RevlogError when the rebuilt
        text does not hash to node.
        """
        if node == nullid:
            return ""

        text = None
        chain = []
        iter_node = node
        rev = self.rev(iter_node)
        # reconstruct the revision if it is from a changegroup: follow the
        # delta bases until we hit the cached text or a non-bundle rev
        while self.bundle(rev):
            if self.cache and self.cache[0] == iter_node:
                text = self.cache[2]
                break
            chain.append(rev)
            iter_node = self.bundlebase(rev)
            rev = self.rev(iter_node)
        if text is None:
            text = revlog.revlog.revision(self, iter_node)

        # apply the collected deltas, oldest (last appended) first
        while chain:
            delta = self.chunk(chain.pop())
            text = self.patches(text, [delta])

        p1, p2 = self.parents(node)
        if node != revlog.hash(text, p1, p2):
            raise revlog.RevlogError(_("integrity check failed on %s:%d")
                                     % (self.datafile, self.rev(node)))

        # cache layout: (node, rev, text)
        self.cache = (node, self.rev(node), text)
        return text

    # Writing operations are not implemented for this class.
    def addrevision(self, text, transaction, link, p1=None, p2=None, d=None):
        raise NotImplementedError

    def addgroup(self, revs, linkmapper, transaction, unique=0):
        raise NotImplementedError

    def strip(self, rev, minlink):
        raise NotImplementedError

    def checksize(self):
        raise NotImplementedError
Benoit Boissinot
|
class bundlechangelog(bundlerevlog, changelog.changelog):
    """Changelog combined with the bundlerevlog overlay."""

    def __init__(self, opener, bundlefile):
        """Initialise the changelog, then index the bundle on top of it.

        No linkmapper is handed to bundlerevlog.
        """
        changelog.changelog.__init__(self, opener)
        # self.indexfile is read only after the changelog initialiser ran
        index = self.indexfile
        bundlerevlog.__init__(self, opener, index, bundlefile)
Benoit Boissinot
|
r1942 | |||
Benoit Boissinot
|
class bundlemanifest(bundlerevlog, manifest.manifest):
    """Manifest combined with the bundlerevlog overlay."""

    def __init__(self, opener, bundlefile, linkmapper):
        """Initialise the manifest, then index the bundle on top of it.

        linkmapper is forwarded unchanged to bundlerevlog.
        """
        manifest.manifest.__init__(self, opener)
        # self.indexfile is read only after the manifest initialiser ran
        index = self.indexfile
        bundlerevlog.__init__(self, opener, index, bundlefile, linkmapper)
Benoit Boissinot
|
r1942 | |||
Benoit Boissinot
|
class bundlefilelog(bundlerevlog, filelog.filelog):
    """Filelog combined with the bundlerevlog overlay."""

    def __init__(self, opener, path, bundlefile, linkmapper):
        """Initialise the filelog for path, then index the bundle on top.

        linkmapper is forwarded unchanged to bundlerevlog.
        """
        filelog.filelog.__init__(self, opener, path)
        # self.indexfile is read only after the filelog initialiser ran
        index = self.indexfile
        bundlerevlog.__init__(self, opener, index, bundlefile, linkmapper)
Benoit Boissinot
|
r1942 | |||
Benoit Boissinot
|
class bundlerepository(localrepo.localrepository):
    """Local repository whose revlogs are overlaid with a bundle file.

    The changelog, the manifest and the filelogs of files named in the
    bundle are bundle-aware revlogs; every other file uses a plain
    filelog.
    """

    def __init__(self, ui, path, bundlename):
        """Open bundlename and index it on top of the repository at path.

        ui, path   -- passed unchanged to localrepository.__init__
        bundlename -- path of the bundle file; "HG10UN" bundles are read
                      in place, "HG10BZ" bundles are first decompressed
                      into a temporary "HG10UN" file

        Raises util.Abort when the header is not a known bundle header.
        """
        localrepo.localrepository.__init__(self, ui, path)

        # Build the URL in the "bundle:<repo path>+<bundle file>" order
        # that instance() parses, so that url() can be fed back to it.
        if path:
            self._url = 'bundle:' + path + '+' + bundlename
        else:
            self._url = 'bundle:' + bundlename

        self.tempfile = None
        self.bundlefile = open(bundlename, "rb")
        header = self.bundlefile.read(6)
        if not header.startswith("HG"):
            raise util.Abort(_("%s: not a Mercurial bundle file") % bundlename)
        elif not header.startswith("HG10"):
            raise util.Abort(_("%s: unknown bundle version") % bundlename)
        elif header == "HG10BZ":
            # decompress into a temporary uncompressed bundle and read
            # from that file instead
            fdtemp, temp = tempfile.mkstemp(prefix="hg-bundle-",
                                            suffix=".hg10un", dir=self.path)
            self.tempfile = temp
            fptemp = os.fdopen(fdtemp, 'wb')

            def generator(f):
                zd = bz2.BZ2Decompressor()
                # the "BZ" bytes were consumed as part of the 6 byte
                # header read above; feed them to the decompressor first
                zd.decompress("BZ")
                for chunk in f:
                    yield zd.decompress(chunk)

            gen = generator(util.filechunkiter(self.bundlefile, 4096))

            try:
                fptemp.write("HG10UN")
                for chunk in gen:
                    fptemp.write(chunk)
            finally:
                fptemp.close()
                self.bundlefile.close()

            self.bundlefile = open(self.tempfile, "rb")
            # seek right after the header
            self.bundlefile.seek(6)
        elif header == "HG10UN":
            # nothing to do
            pass
        else:
            raise util.Abort(_("%s: unknown bundle compression type")
                             % bundlename)
        # The bundle is read sequentially: the changelog and manifest
        # constructors each read chunks from the current file position.
        self.changelog = bundlechangelog(self.sopener, self.bundlefile)
        self.manifest = bundlemanifest(self.sopener, self.bundlefile,
                                       self.changelog.rev)
        # dict with the mapping 'filename' -> position in the bundle
        self.bundlefilespos = {}
        while 1:
            f = changegroup.getchunk(self.bundlefile)
            if not f:
                break
            self.bundlefilespos[f] = self.bundlefile.tell()
            # skip over this file's chunks; only the position is needed
            for c in changegroup.chunkiter(self.bundlefile):
                pass

    def url(self):
        """Return the "bundle:" URL built in __init__."""
        return self._url

    def dev(self):
        """Return -1 (presumably: no backing device -- TODO confirm)."""
        return -1

    def file(self, f):
        """Return the filelog for f, bundle-aware if f is in the bundle.

        A single leading '/' is stripped from f before the lookup.
        """
        # startswith() instead of f[0] so an empty name does not raise
        if f.startswith('/'):
            f = f[1:]
        if f in self.bundlefilespos:
            # position the bundle at this file's chunks before indexing
            self.bundlefile.seek(self.bundlefilespos[f])
            return bundlefilelog(self.sopener, f, self.bundlefile,
                                 self.changelog.rev)
        else:
            return filelog.filelog(self.sopener, f)

    def close(self):
        """Close assigned bundle file immediately."""
        self.bundlefile.close()

    def __del__(self):
        """Close the bundle file and remove the temporary file, if any."""
        # getattr with a default: the attributes may be missing if
        # __init__ failed before setting them
        bundlefile = getattr(self, 'bundlefile', None)
        if bundlefile and not bundlefile.closed:
            bundlefile.close()
        # local name chosen so it does not shadow the tempfile module
        temppath = getattr(self, 'tempfile', None)
        if temppath is not None:
            os.unlink(temppath)
Vadim Gelfer
|
r2740 | |||
def instance(ui, path, create):
    """Build a bundlerepository from a path or a "bundle:" URL.

    A "bundle:" URL is split on the first "+" into repository path and
    bundle file name; without a "+" (or without the "bundle:" prefix)
    the repository path is empty and the whole path names the bundle.

    Raises util.Abort when create is true.
    """
    if create:
        raise util.Abort(_('cannot create new bundle repository'))

    path = util.drop_scheme('file', path)

    # defaults: no repository path, everything is the bundle file name
    repopath = ''
    bundlename = path
    if path.startswith('bundle:'):
        pieces = util.drop_scheme('bundle', path).split("+", 1)
        bundlename = pieces[-1]
        if len(pieces) == 2:
            repopath = pieces[0]

    return bundlerepository(ui, repopath, bundlename)