bundlerepo.py
290 lines
| 9.9 KiB
| text/x-python
|
PythonLexer
/ mercurial / bundlerepo.py
Martin Geisler
|
r8226 | # bundlerepo.py - repository class for viewing uncompressed bundles | ||
# | ||||
# Copyright 2006, 2007 Benoit Boissinot <bboissin@gmail.com> | ||||
# | ||||
# This software may be used and distributed according to the terms of the | ||||
Matt Mackall
|
r10263 | # GNU General Public License version 2 or any later version. | ||
Benoit Boissinot
|
r1942 | |||
Martin Geisler
|
r8227 | """Repository class for viewing uncompressed bundles. | ||
This provides a read-only repository interface to bundles as if they | ||||
were part of the actual repository. | ||||
""" | ||||
Peter Arrenbrecht
|
r7873 | from node import nullid | ||
Matt Mackall
|
r3891 | from i18n import _ | ||
Matt Mackall
|
r12044 | import os, struct, tempfile, shutil | ||
Simon Heimberg
|
r8312 | import changegroup, util, mdiff | ||
Peter Arrenbrecht
|
r7873 | import localrepo, changelog, manifest, filelog, revlog, error | ||
Benoit Boissinot
|
r1942 | |||
Benoit Boissinot
|
class bundlerevlog(revlog.revlog):
    """Revlog that layers the revisions found in a bundle on top of the
    revisions already present in the underlying revlog.

    Revisions coming from the bundle are appended to the in-memory index
    and recorded in ``self.basemap``; their deltas are read from the
    bundle object on demand. All write operations raise
    NotImplementedError.
    """

    def __init__(self, opener, indexfile, bundle,
                 linkmapper=None):
        """Load the regular revlog, then index the next group of chunks
        read from ``bundle``.

        opener, indexfile -- passed unchanged to revlog.revlog.__init__
        bundle -- object providing chunk(), tell(), seek() and read()
        linkmapper -- optional callable applied to the 20-byte ``cs``
            field of each chunk to obtain the link revision; when None
            the revision's own number is used as its link

        Raises util.Abort if a chunk is shorter than its 80-byte header
        and error.LookupError if a chunk names a parent that is unknown.
        """
        # How it works:
        # to retrieve a revision, we need to know the offset of
        # the revision in the bundle (an unbundle object).
        #
        # We store this offset in the index (start). To tell a rev that
        # comes from the bundle apart from a rev stored in the revlog,
        # we record every bundle rev in self.basemap, which maps the rev
        # to the node its delta applies to (see inbundle/bundlebase).
        #
        revlog.revlog.__init__(self, opener, indexfile)
        self.bundle = bundle
        self.basemap = {}
        def chunkpositer():
            # Yield (chunk, offset) pairs until an empty chunk is read.
            # The offset is the position reported after the read minus
            # the chunk length, i.e. where the chunk data begins.
            while 1:
                chunk = bundle.chunk()
                if not chunk:
                    break
                pos = bundle.tell()
                yield chunk, pos - len(chunk)
        n = len(self)
        prev = None
        for chunk, start in chunkpositer():
            size = len(chunk)
            if size < 80:
                raise util.Abort(_("invalid changegroup"))
            # skip the 80-byte header: four 20-byte fields
            # (node, p1, p2, cs); what remains is the delta
            start += 80
            size -= 80
            node, p1, p2, cs = struct.unpack("20s20s20s20s", chunk[:80])
            if node in self.nodemap:
                # already known: nothing to add, but it still becomes
                # the delta base of the following chunk
                prev = node
                continue
            for p in (p1, p2):
                if not p in self.nodemap:
                    raise error.LookupError(p, self.indexfile,
                                            _("unknown parent"))
            if linkmapper is None:
                link = n
            else:
                link = linkmapper(cs)
            # the first chunk of the group is a delta against its p1,
            # later ones against the node of the preceding chunk
            if not prev:
                prev = p1
            # start, size, full unc. size, base (unused), link, p1, p2, node
            e = (revlog.offset_type(start, 0), size, -1, -1, link,
                 self.rev(p1), self.rev(p2), node)
            self.basemap[n] = prev
            # NOTE(review): insert(-1, ...) places the entry before the
            # last index element - presumably a trailing sentinel kept
            # by revlog; confirm against revlog's index layout
            self.index.insert(-1, e)
            self.nodemap[node] = n
            prev = node
            n += 1

    def inbundle(self, rev):
        """is rev from the bundle"""
        if rev < 0:
            return False
        return rev in self.basemap

    def bundlebase(self, rev):
        """return the node that the bundle delta of rev applies to

        Raises KeyError if rev was not added from the bundle.
        """
        return self.basemap[rev]

    def _chunk(self, rev):
        """return the stored chunk for rev, read from the bundle when
        rev comes from the bundle and from the revlog otherwise"""
        # Warning: in case of bundle, the diff is against bundlebase,
        # not against rev - 1
        # XXX: could use some caching
        if not self.inbundle(rev):
            return revlog.revlog._chunk(self, rev)
        self.bundle.seek(self.start(rev))
        return self.bundle.read(self.length(rev))

    def revdiff(self, rev1, rev2):
        """return or calculate a delta between two revisions"""
        if self.inbundle(rev1) and self.inbundle(rev2):
            # hot path for bundle: the chunk stored for rev2 already is
            # the delta against rev1
            revb = self.rev(self.bundlebase(rev2))
            if revb == rev1:
                return self._chunk(rev2)
        elif not self.inbundle(rev1) and not self.inbundle(rev2):
            return revlog.revlog.revdiff(self, rev1, rev2)

        # every other combination: diff the two full texts
        return mdiff.textdiff(self.revision(self.node(rev1)),
                              self.revision(self.node(rev2)))

    def revision(self, node):
        """return the uncompressed text of the revision identified by node

        Raises error.RevlogError if the rebuilt text does not hash to node.
        """
        if node == nullid:
            return ""

        text = None
        chain = []
        iter_node = node
        rev = self.rev(iter_node)
        # reconstruct the revision if it is from a changegroup:
        # follow the delta bases back until we reach either the cached
        # text or a revision that is stored in the revlog itself
        while self.inbundle(rev):
            if self._cache and self._cache[0] == iter_node:
                text = self._cache[2]
                break
            chain.append(rev)
            iter_node = self.bundlebase(rev)
            rev = self.rev(iter_node)
        if text is None:
            text = revlog.revlog.revision(self, iter_node)

        # apply the collected deltas, starting with the one closest to
        # the base text
        while chain:
            delta = self._chunk(chain.pop())
            text = mdiff.patches(text, [delta])

        p1, p2 = self.parents(node)
        if node != revlog.hash(text, p1, p2):
            raise error.RevlogError(_("integrity check failed on %s:%d")
                                    % (self.datafile, self.rev(node)))

        self._cache = (node, self.rev(node), text)
        return text

    # The operations below would modify the revlog; none of them is
    # implemented for a bundle revlog.
    def addrevision(self, text, transaction, link, p1=None, p2=None, d=None):
        raise NotImplementedError
    def addgroup(self, revs, linkmapper, transaction):
        raise NotImplementedError
    def strip(self, rev, minlink):
        raise NotImplementedError
    def checksize(self):
        raise NotImplementedError
Benoit Boissinot
|
class bundlechangelog(bundlerevlog, changelog.changelog):
    """Changelog combined with the changeset chunks read from a bundle."""

    def __init__(self, opener, bundle):
        # The changelog initializer runs first; self.indexfile is only
        # read afterwards (presumably that initializer is what sets it).
        changelog.changelog.__init__(self, opener)
        indexfile = self.indexfile
        bundlerevlog.__init__(self, opener, indexfile, bundle)
Benoit Boissinot
|
r1942 | |||
Benoit Boissinot
|
class bundlemanifest(bundlerevlog, manifest.manifest):
    """Manifest combined with the manifest chunks read from a bundle."""

    def __init__(self, opener, bundle, linkmapper):
        # The manifest initializer runs first; self.indexfile is only
        # read afterwards (presumably that initializer is what sets it).
        manifest.manifest.__init__(self, opener)
        indexfile = self.indexfile
        bundlerevlog.__init__(self, opener, indexfile, bundle,
                              linkmapper=linkmapper)
Benoit Boissinot
|
r1942 | |||
Benoit Boissinot
|
class bundlefilelog(bundlerevlog, filelog.filelog):
    """Filelog for one path combined with its chunks read from a bundle."""

    def __init__(self, opener, path, bundle, linkmapper):
        # The filelog initializer runs first; self.indexfile is only
        # read afterwards (presumably that initializer is what sets it).
        filelog.filelog.__init__(self, opener, path)
        indexfile = self.indexfile
        bundlerevlog.__init__(self, opener, indexfile, bundle,
                              linkmapper=linkmapper)
Benoit Boissinot
|
r1942 | |||
Benoit Boissinot
|
class bundlerepository(localrepo.localrepository):
    """Local repository whose changelog, manifest and filelogs are
    extended with the contents of a bundle file."""

    def __init__(self, ui, path, bundlename):
        """Open the repository at ``path`` and overlay ``bundlename``.

        ui -- ui object handed to the localrepo initializer
        path -- parent repository path; if opening it raises
            error.RepoError, a temporary directory is created and used
            as the parent repository instead
        bundlename -- path of the bundle file to read
        """
        self._tempparent = None
        try:
            localrepo.localrepository.__init__(self, ui, path)
        except error.RepoError:
            # no usable parent repository: fall back to a scratch one
            # (the trailing 1 is presumably the "create" flag - confirm
            # against localrepo.instance)
            self._tempparent = tempfile.mkdtemp()
            localrepo.instance(ui, self._tempparent, 1)
            localrepo.localrepository.__init__(self, ui, self._tempparent)

        if path:
            self._url = 'bundle:' + util.expandpath(path) + '+' + bundlename
        else:
            self._url = 'bundle:' + bundlename

        self.tempfile = None
        f = open(bundlename, "rb")
        self.bundle = changegroup.readbundle(f, bundlename)
        if self.bundle.compressed():
            # Copy the bundle contents into a temporary "HG10UN" file
            # inside the repository and read from that file instead
            # (presumably because the revlogs need to seek in the data).
            fdtemp, temp = tempfile.mkstemp(prefix="hg-bundle-",
                                            suffix=".hg10un", dir=self.path)
            self.tempfile = temp
            fptemp = os.fdopen(fdtemp, 'wb')

            try:
                fptemp.write("HG10UN")
                while 1:
                    chunk = self.bundle.read(2**18)
                    if not chunk:
                        break
                    fptemp.write(chunk)
            finally:
                fptemp.close()

            f = open(self.tempfile, "rb")
            self.bundle = changegroup.readbundle(f, bundlename)

        # dict with the mapping 'filename' -> position in the bundle
        self.bundlefilespos = {}

    @util.propertycache
    def changelog(self):
        """Changelog including the bundle's changesets.

        Building it consumes the changelog group of the bundle; the
        position reached afterwards is stored as self.manstart.
        """
        c = bundlechangelog(self.sopener, self.bundle)
        self.manstart = self.bundle.tell()
        return c

    @util.propertycache
    def manifest(self):
        """Manifest including the bundle's manifest revisions.

        Reading starts at self.manstart; the position reached afterwards
        is stored as self.filestart.
        """
        self.bundle.seek(self.manstart)
        m = bundlemanifest(self.sopener, self.bundle, self.changelog.rev)
        self.filestart = self.bundle.tell()
        return m

    @util.propertycache
    def manstart(self):
        """Bundle offset at which the manifest group starts."""
        # Loading the changelog assigns self.manstart as a side effect.
        # NOTE(review): this relies on the instance attribute set there
        # taking precedence over this property on the next lookup -
        # confirm util.propertycache behaves that way.
        self.changelog
        return self.manstart

    @util.propertycache
    def filestart(self):
        """Bundle offset at which the file groups start."""
        # Same mechanism as manstart: loading the manifest assigns
        # self.filestart as a side effect.
        self.manifest
        return self.filestart

    def url(self):
        """Return the 'bundle:' URL built in __init__."""
        return self._url

    def file(self, f):
        """Return the filelog for ``f``.

        A bundlefilelog is returned when the bundle has a group for
        ``f``, a plain filelog.filelog otherwise. A single leading '/'
        in ``f`` is dropped.
        """
        if not self.bundlefilespos:
            # First call: walk the file groups once and remember where
            # the data of each file begins.
            self.bundle.seek(self.filestart)
            while 1:
                chunk = self.bundle.chunk()
                if not chunk:
                    break
                # this chunk is the file name; the group data follows
                self.bundlefilespos[chunk] = self.bundle.tell()
                # skip the group's chunks up to its empty terminator
                while 1:
                    c = self.bundle.chunk()
                    if not c:
                        break

        if f[0] == '/':
            f = f[1:]
        if f in self.bundlefilespos:
            self.bundle.seek(self.bundlefilespos[f])
            return bundlefilelog(self.sopener, f, self.bundle,
                                 self.changelog.rev)
        else:
            return filelog.filelog(self.sopener, f)

    def close(self):
        """Close assigned bundle file immediately."""
        self.bundle.close()

    def __del__(self):
        """Drop the bundle and remove the temporary file and directory."""
        # __init__ can fail before any of these attributes is assigned,
        # so none of them may be assumed to exist here.
        try:
            del self.bundle
        except AttributeError:
            pass
        # Use the instance attribute under a local name that does not
        # shadow the tempfile module: testing the bare name "tempfile"
        # would look at the module, which is never None.
        temppath = getattr(self, 'tempfile', None)
        if temppath is not None:
            os.unlink(temppath)
        tempparent = getattr(self, '_tempparent', None)
        if tempparent:
            shutil.rmtree(tempparent, True)

    def cancopy(self):
        """Always False for a bundle repository."""
        return False

    def getcwd(self):
        """Return the process working directory."""
        return os.getcwd() # always outside the repo
Vadim Gelfer
|
def instance(ui, path, create):
    """Build a bundlerepository from a plain path or a 'bundle:' URL.

    ui -- ui object; its "bundle.mainreporoot" setting supplies the
        default parent repository path
    path -- bundle file name, or 'bundle:[repopath+]bundlename'; a
        'file' scheme is dropped first
    create -- must be false; bundle repositories cannot be created

    Raises util.Abort when ``create`` is true.
    """
    if create:
        raise util.Abort(_('cannot create new bundle repository'))

    parentpath = ui.config("bundle", "mainreporoot", "")
    if parentpath:
        # Try to make the full path relative so we get a nice, short URL.
        # In particular, we don't want temp dir names in test outputs.
        here = os.getcwd()
        prefix = os.path.join(here, '')
        if parentpath == here:
            parentpath = ''
        elif parentpath.startswith(prefix):
            parentpath = parentpath[len(prefix):]

    path = util.drop_scheme('file', path)

    # Default: the whole path names the bundle, parent comes from config.
    repopath, bundlename = parentpath, path
    if path.startswith('bundle:'):
        pieces = util.drop_scheme('bundle', path).split("+", 1)
        if len(pieces) == 2:
            # explicit "repopath+bundlename" form
            repopath, bundlename = pieces
        else:
            bundlename = pieces[0]
    return bundlerepository(ui, repopath, bundlename)