Show More
archival.py
360 lines
| 11.0 KiB
| text/x-python
|
PythonLexer
/ mercurial / archival.py
Vadim Gelfer
|
r2112 | # archival.py - revision archival for mercurial | ||
# | ||||
# Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com> | ||||
# | ||||
Martin Geisler
|
r8225 | # This software may be used and distributed according to the terms of the | ||
Matt Mackall
|
r10263 | # GNU General Public License version 2 or any later version. | ||
Vadim Gelfer
|
r2112 | |||
Gregory Szorc
|
r25916 | from __future__ import absolute_import | ||
import gzip | ||||
import os | ||||
FUJIWARA Katsunori
|
r17628 | import struct | ||
Gregory Szorc
|
r25916 | import tarfile | ||
import time | ||||
import zipfile | ||||
import zlib | ||||
from .i18n import _ | ||||
from . import ( | ||||
error, | ||||
Matt Harbison
|
r33544 | formatter, | ||
Gregory Szorc
|
r25916 | match as matchmod, | ||
Matt Harbison
|
r36156 | scmutil, | ||
Gregory Szorc
|
r25916 | util, | ||
Pierre-Yves David
|
r31235 | vfs as vfsmod, | ||
Gregory Szorc
|
r25916 | ) | ||
timeless
|
r28861 | stringio = util.stringio | ||
Vadim Gelfer
|
r2112 | |||
Mads Kiilerich
|
r17429 | # from unzip source code: | ||
_UNX_IFREG = 0x8000 | ||||
_UNX_IFLNK = 0xa000 | ||||
Martin Geisler
|
r11558 | def tidyprefix(dest, kind, prefix): | ||
Vadim Gelfer
|
r2112 | '''choose prefix to use for names in archive. make sure prefix is | ||
safe for consumers.''' | ||||
if prefix: | ||||
Shun-ichi GOTO
|
r5842 | prefix = util.normpath(prefix) | ||
Vadim Gelfer
|
r2112 | else: | ||
Pulkit Goyal
|
r36455 | if not isinstance(dest, bytes): | ||
Vadim Gelfer
|
r2112 | raise ValueError('dest must be string if no prefix') | ||
prefix = os.path.basename(dest) | ||||
lower = prefix.lower() | ||||
Martin Geisler
|
r11558 | for sfx in exts.get(kind, []): | ||
Vadim Gelfer
|
r2112 | if lower.endswith(sfx): | ||
prefix = prefix[:-len(sfx)] | ||||
break | ||||
lpfx = os.path.normpath(util.localpath(prefix)) | ||||
prefix = util.pconvert(lpfx) | ||||
if not prefix.endswith('/'): | ||||
prefix += '/' | ||||
Matt Harbison
|
r24953 | # Drop the leading '.' path component if present, so Windows can read the | ||
# zip files (issue4634) | ||||
if prefix.startswith('./'): | ||||
prefix = prefix[2:] | ||||
Vadim Gelfer
|
r2112 | if prefix.startswith('../') or os.path.isabs(lpfx) or '/../' in prefix: | ||
Pierre-Yves David
|
r26587 | raise error.Abort(_('archive prefix contains illegal components')) | ||
Vadim Gelfer
|
r2112 | return prefix | ||
Martin Geisler
|
r11557 | exts = { | ||
'tar': ['.tar'], | ||||
'tbz2': ['.tbz2', '.tar.bz2'], | ||||
'tgz': ['.tgz', '.tar.gz'], | ||||
'zip': ['.zip'], | ||||
} | ||||
def guesskind(dest): | ||||
for kind, extensions in exts.iteritems(): | ||||
Augie Fackler
|
r25149 | if any(dest.endswith(ext) for ext in extensions): | ||
Martin Geisler
|
r11557 | return kind | ||
return None | ||||
Yuya Nishihara
|
r24681 | def _rootctx(repo): | ||
# repo[0] may be hidden | ||||
for rev in repo: | ||||
return repo[rev] | ||||
return repo['null'] | ||||
Yuya Nishihara
|
r35923 | # {tags} on ctx includes local tags and 'tip', with no current way to limit | ||
# that to global tags. Therefore, use {latesttag} as a substitute when | ||||
# the distance is 0, since that will be the list of global tags on ctx. | ||||
_defaultmetatemplate = br''' | ||||
repo: {root} | ||||
node: {ifcontains(rev, revset("wdir()"), "{p1node}{dirty}", "{node}")} | ||||
branch: {branch|utf8} | ||||
{ifeq(latesttagdistance, 0, join(latesttag % "tag: {tag}", "\n"), | ||||
separate("\n", | ||||
join(latesttag % "latesttag: {tag}", "\n"), | ||||
"latesttagdistance: {latesttagdistance}", | ||||
"changessincelatesttag: {changessincelatesttag}"))} | ||||
'''[1:] # drop leading '\n' | ||||
Yuya Nishihara
|
r24678 | def buildmetadata(ctx): | ||
'''build content of .hg_archival.txt''' | ||||
repo = ctx.repo() | ||||
Matt Harbison
|
r33544 | |||
opts = { | ||||
Matt Harbison
|
r33545 | 'template': repo.ui.config('experimental', 'archivemetatemplate', | ||
Yuya Nishihara
|
r35923 | _defaultmetatemplate) | ||
Matt Harbison
|
r33544 | } | ||
out = util.stringio() | ||||
Yuya Nishihara
|
r24678 | |||
Matt Harbison
|
r33544 | fm = formatter.formatter(repo.ui, out, 'archive', opts) | ||
fm.startitem() | ||||
fm.context(ctx=ctx) | ||||
fm.data(root=_rootctx(repo).hex()) | ||||
if ctx.rev() is None: | ||||
dirty = '' | ||||
if ctx.dirty(missing=True): | ||||
dirty = '+' | ||||
fm.data(dirty=dirty) | ||||
fm.end() | ||||
return out.getvalue() | ||||
Martin Geisler
|
r11557 | |||
Benoit Boissinot
|
r8778 | class tarit(object): | ||
Vadim Gelfer
|
r2112 | '''write archive to tar file or stream. can write uncompressed, | ||
or compress with gzip or bzip2.''' | ||||
csaba.henk@creo.hu
|
r4652 | class GzipFileWithTime(gzip.GzipFile): | ||
def __init__(self, *args, **kw): | ||||
timestamp = None | ||||
if 'timestamp' in kw: | ||||
Pulkit Goyal
|
r35350 | timestamp = kw.pop(r'timestamp') | ||
Martin Geisler
|
r8527 | if timestamp is None: | ||
csaba.henk@creo.hu
|
r4652 | self.timestamp = time.time() | ||
else: | ||||
self.timestamp = timestamp | ||||
gzip.GzipFile.__init__(self, *args, **kw) | ||||
def _write_gzip_header(self): | ||||
self.fileobj.write('\037\213') # magic header | ||||
self.fileobj.write('\010') # compression method | ||||
timeless@mozdev.org
|
r26198 | fname = self.name | ||
Brodie Rao
|
r13102 | if fname and fname.endswith('.gz'): | ||
fname = fname[:-3] | ||||
csaba.henk@creo.hu
|
r4652 | flags = 0 | ||
if fname: | ||||
flags = gzip.FNAME | ||||
self.fileobj.write(chr(flags)) | ||||
gzip.write32u(self.fileobj, long(self.timestamp)) | ||||
self.fileobj.write('\002') | ||||
self.fileobj.write('\377') | ||||
if fname: | ||||
self.fileobj.write(fname + '\000') | ||||
Martin Geisler
|
r11558 | def __init__(self, dest, mtime, kind=''): | ||
Vadim Gelfer
|
r2477 | self.mtime = mtime | ||
Dan Villiom Podlaski Christiansen
|
r13400 | self.fileobj = None | ||
csaba.henk@creo.hu
|
r4652 | |||
Augie Fackler
|
r30479 | def taropen(mode, name='', fileobj=None): | ||
csaba.henk@creo.hu
|
r4652 | if kind == 'gz': | ||
Pulkit Goyal
|
r36465 | mode = mode[0:1] | ||
csaba.henk@creo.hu
|
r4652 | if not fileobj: | ||
csaba.henk@creo.hu
|
r4731 | fileobj = open(name, mode + 'b') | ||
csaba.henk@creo.hu
|
r4652 | gzfileobj = self.GzipFileWithTime(name, mode + 'b', | ||
zlib.Z_BEST_COMPRESSION, | ||||
fileobj, timestamp=mtime) | ||||
Dan Villiom Podlaski Christiansen
|
r13400 | self.fileobj = gzfileobj | ||
csaba.henk@creo.hu
|
r4652 | return tarfile.TarFile.taropen(name, mode, gzfileobj) | ||
else: | ||||
return tarfile.open(name, mode + kind, fileobj) | ||||
Vadim Gelfer
|
r2112 | if isinstance(dest, str): | ||
Augie Fackler
|
r30479 | self.z = taropen('w:', name=dest) | ||
Vadim Gelfer
|
r2112 | else: | ||
Augie Fackler
|
r30479 | self.z = taropen('w|', fileobj=dest) | ||
Vadim Gelfer
|
r2112 | |||
Alexis S. L. Carvalho
|
r4831 | def addfile(self, name, mode, islink, data): | ||
Martin Geisler
|
r11558 | i = tarfile.TarInfo(name) | ||
Vadim Gelfer
|
r2112 | i.mtime = self.mtime | ||
i.size = len(data) | ||||
Alexis S. L. Carvalho
|
r4831 | if islink: | ||
i.type = tarfile.SYMTYPE | ||||
Gregory Szorc
|
r25658 | i.mode = 0o777 | ||
Alexis S. L. Carvalho
|
r4831 | i.linkname = data | ||
data = None | ||||
Peter van Dijk
|
r7770 | i.size = 0 | ||
Alexis S. L. Carvalho
|
r4831 | else: | ||
i.mode = mode | ||||
timeless
|
r28861 | data = stringio(data) | ||
Alexis S. L. Carvalho
|
r4831 | self.z.addfile(i, data) | ||
Vadim Gelfer
|
r2112 | |||
def done(self): | ||||
self.z.close() | ||||
Dan Villiom Podlaski Christiansen
|
r13400 | if self.fileobj: | ||
self.fileobj.close() | ||||
Vadim Gelfer
|
r2112 | |||
Benoit Boissinot
|
r8778 | class tellable(object): | ||
Vadim Gelfer
|
r2112 | '''provide tell method for zipfile.ZipFile when writing to http | ||
response file object.''' | ||||
def __init__(self, fp): | ||||
self.fp = fp | ||||
self.offset = 0 | ||||
def __getattr__(self, key): | ||||
return getattr(self.fp, key) | ||||
def write(self, s): | ||||
self.fp.write(s) | ||||
self.offset += len(s) | ||||
def tell(self): | ||||
return self.offset | ||||
Benoit Boissinot
|
r8778 | class zipit(object): | ||
Vadim Gelfer
|
r2112 | '''write archive to zip file or stream. can write uncompressed, | ||
or compressed with deflate.''' | ||||
Martin Geisler
|
r11558 | def __init__(self, dest, mtime, compress=True): | ||
Colin McMillen
|
r2168 | if not isinstance(dest, str): | ||
try: | ||||
dest.tell() | ||||
Thomas Arendsen Hein
|
r2169 | except (AttributeError, IOError): | ||
Colin McMillen
|
r2168 | dest = tellable(dest) | ||
Gregory Szorc
|
r36053 | self.z = zipfile.ZipFile(dest, r'w', | ||
Vadim Gelfer
|
r2112 | compress and zipfile.ZIP_DEFLATED or | ||
zipfile.ZIP_STORED) | ||||
Martin Geisler
|
r12319 | |||
# Python's zipfile module emits deprecation warnings if we try | ||||
# to store files with a date before 1980. | ||||
epoch = 315532800 # calendar.timegm((1980, 1, 1, 0, 0, 0, 1, 1, 0)) | ||||
if mtime < epoch: | ||||
mtime = epoch | ||||
FUJIWARA Katsunori
|
r17628 | self.mtime = mtime | ||
Vadim Gelfer
|
r2477 | self.date_time = time.gmtime(mtime)[:6] | ||
Vadim Gelfer
|
r2112 | |||
Alexis S. L. Carvalho
|
r4831 | def addfile(self, name, mode, islink, data): | ||
Martin Geisler
|
r11558 | i = zipfile.ZipInfo(name, self.date_time) | ||
Vadim Gelfer
|
r2112 | i.compress_type = self.z.compression | ||
# unzip will not honor unix file modes unless file creator is | ||||
# set to unix (id 3). | ||||
i.create_system = 3 | ||||
Mads Kiilerich
|
r17429 | ftype = _UNX_IFREG | ||
Alexis S. L. Carvalho
|
r4831 | if islink: | ||
Gregory Szorc
|
r25658 | mode = 0o777 | ||
Mads Kiilerich
|
r17429 | ftype = _UNX_IFLNK | ||
Pulkit Goyal
|
r29890 | i.external_attr = (mode | ftype) << 16 | ||
FUJIWARA Katsunori
|
r17628 | # add "extended-timestamp" extra block, because zip archives | ||
# without this will be extracted with unexpected timestamp, | ||||
# if TZ is not configured as GMT | ||||
i.extra += struct.pack('<hhBl', | ||||
0x5455, # block type: "extended-timestamp" | ||||
1 + 4, # size of this block | ||||
1, # "modification time is present" | ||||
Mads Kiilerich
|
r18301 | int(self.mtime)) # last modification (UTC) | ||
Vadim Gelfer
|
r2112 | self.z.writestr(i, data) | ||
def done(self): | ||||
self.z.close() | ||||
Benoit Boissinot
|
r8778 | class fileit(object): | ||
Vadim Gelfer
|
r2112 | '''write archive as files in directory.''' | ||
Martin Geisler
|
r11558 | def __init__(self, name, mtime): | ||
Vadim Gelfer
|
r2112 | self.basedir = name | ||
Pierre-Yves David
|
r31235 | self.opener = vfsmod.vfs(self.basedir) | ||
James May
|
r35203 | self.mtime = mtime | ||
Vadim Gelfer
|
r2112 | |||
Alexis S. L. Carvalho
|
r4831 | def addfile(self, name, mode, islink, data): | ||
if islink: | ||||
self.opener.symlink(data, name) | ||||
return | ||||
Alexis S. L. Carvalho
|
r4830 | f = self.opener(name, "w", atomictemp=True) | ||
f.write(data) | ||||
Greg Ward
|
r15057 | f.close() | ||
Vadim Gelfer
|
r2112 | destfile = os.path.join(self.basedir, name) | ||
Alexis S. L. Carvalho
|
r4830 | os.chmod(destfile, mode) | ||
James May
|
r35203 | if self.mtime is not None: | ||
os.utime(destfile, (self.mtime, self.mtime)) | ||||
Vadim Gelfer
|
r2112 | |||
def done(self): | ||||
pass | ||||
archivers = { | ||||
'files': fileit, | ||||
'tar': tarit, | ||||
Martin Geisler
|
r11558 | 'tbz2': lambda name, mtime: tarit(name, mtime, 'bz2'), | ||
'tgz': lambda name, mtime: tarit(name, mtime, 'gz'), | ||||
'uzip': lambda name, mtime: zipit(name, mtime, False), | ||||
Vadim Gelfer
|
r2112 | 'zip': zipit, | ||
} | ||||
def archive(repo, dest, node, kind, decode=True, matchfn=None, | ||||
Matt Harbison
|
r24172 | prefix='', mtime=None, subrepos=False): | ||
Vadim Gelfer
|
r2112 | '''create archive of repo as it was at node. | ||
dest can be name of directory, name of archive file, or file | ||||
object to write archive to. | ||||
kind is type of archive to create. | ||||
decode tells whether to put files through decode filters from | ||||
hgrc. | ||||
matchfn is function to filter names of files to write to archive. | ||||
James May
|
r35203 | prefix is name of path to put before every archive member. | ||
mtime is the modified time, in seconds, or None to use the changeset time. | ||||
subrepos tells whether to include subrepos. | ||||
''' | ||||
Vadim Gelfer
|
r2112 | |||
Martin Geisler
|
r11558 | if kind == 'files': | ||
if prefix: | ||||
Pierre-Yves David
|
r26587 | raise error.Abort(_('cannot give prefix when archiving to files')) | ||
Martin Geisler
|
r11558 | else: | ||
prefix = tidyprefix(dest, kind, prefix) | ||||
Alexis S. L. Carvalho
|
r4951 | def write(name, mode, islink, getdata): | ||
data = getdata() | ||||
Vadim Gelfer
|
r2112 | if decode: | ||
Matt Mackall
|
r4005 | data = repo.wwritedata(name, data) | ||
Martin Geisler
|
r11558 | archiver.addfile(prefix + name, mode, islink, data) | ||
Vadim Gelfer
|
r2112 | |||
Dirkjan Ochtman
|
r6019 | if kind not in archivers: | ||
Pierre-Yves David
|
r26587 | raise error.Abort(_("unknown archive type '%s'") % kind) | ||
Matt Mackall
|
r6749 | |||
ctx = repo[node] | ||||
Martin Geisler
|
r11558 | archiver = archivers[kind](dest, mtime or ctx.date()[0]) | ||
Matt Mackall
|
r6749 | |||
Jun Wu
|
r33499 | if repo.ui.configbool("ui", "archivemeta"): | ||
Thomas Arendsen Hein
|
r16919 | name = '.hg_archival.txt' | ||
if not matchfn or matchfn(name): | ||||
Gregory Szorc
|
r25658 | write(name, 0o644, False, lambda: buildmetadata(ctx)) | ||
Gilles Moris
|
r9614 | |||
Thomas Arendsen Hein
|
r16919 | if matchfn: | ||
files = [f for f in ctx.manifest().keys() if matchfn(f)] | ||||
else: | ||||
files = ctx.manifest().keys() | ||||
total = len(files) | ||||
Angel Ezquerra
|
r18967 | if total: | ||
files.sort() | ||||
Matt Harbison
|
r36156 | scmutil.fileprefetchhooks(repo, ctx, files) | ||
Angel Ezquerra
|
r18967 | repo.ui.progress(_('archiving'), 0, unit=_('files'), total=total) | ||
for i, f in enumerate(files): | ||||
ff = ctx.flags(f) | ||||
Gregory Szorc
|
r25658 | write(f, 'x' in ff and 0o755 or 0o644, 'l' in ff, ctx[f].data) | ||
Angel Ezquerra
|
r18967 | repo.ui.progress(_('archiving'), i + 1, item=f, | ||
unit=_('files'), total=total) | ||||
repo.ui.progress(_('archiving'), None) | ||||
Martin Geisler
|
r12323 | |||
if subrepos: | ||||
Mads Kiilerich
|
r18364 | for subpath in sorted(ctx.substate): | ||
Matt Harbison
|
r25601 | sub = ctx.workingsub(subpath) | ||
Martin von Zweigbergk
|
r28017 | submatch = matchmod.subdirmatcher(subpath, matchfn) | ||
Matt Harbison
|
r31099 | total += sub.archive(archiver, prefix, submatch, decode) | ||
Angel Ezquerra
|
r18967 | |||
if total == 0: | ||||
raise error.Abort(_('no files match the archive pattern')) | ||||
Martin Geisler
|
r12323 | |||
Vadim Gelfer
|
r2112 | archiver.done() | ||
Angel Ezquerra
|
r18967 | return total | ||