gnuarch.py
353 lines
| 12.7 KiB
| text/x-python
|
PythonLexer
Martin Geisler
|
r8250 | # gnuarch.py - GNU Arch support for the convert extension | ||
# | ||||
# Copyright 2008, 2009 Aleix Conchillo Flaque <aleix@member.fsf.org> | ||||
# and others | ||||
# | ||||
# This software may be used and distributed according to the terms of the | ||||
Matt Mackall
|
r10263 | # GNU General Public License version 2 or any later version. | ||
timeless
|
r28366 | from __future__ import absolute_import | ||
Aleix Conchillo Flaque
|
r6035 | |||
Pulkit Goyal
|
r35651 | import email.parser as emailparser | ||
timeless
|
r28366 | import os | ||
import shutil | ||||
import stat | ||||
import tempfile | ||||
Yuya Nishihara
|
r29205 | |||
from mercurial.i18n import _ | ||||
timeless
|
r28366 | from mercurial import ( | ||
encoding, | ||||
error, | ||||
util, | ||||
) | ||||
Boris Feld
|
r36625 | from mercurial.utils import dateutil | ||
timeless
|
r28366 | from . import common | ||
Aleix Conchillo Flaque
|
r6035 | |||
timeless
|
r28366 | class gnuarch_source(common.converter_source, common.commandline): | ||
Aleix Conchillo Flaque
|
r6035 | |||
Benoit Boissinot
|
class gnuarch_rev(object):
    """Plain record holding the data collected for one GNU Arch revision."""

    def __init__(self, rev):
        # Revision identifier exactly as given by the caller.
        self.rev = rev

        # Commit metadata, empty until something fills it in.
        self.author = ''
        self.date = None
        self.summary = ''
        self.continuationof = None

        # Per-revision file changes: three independent lists ...
        self.add_files, self.mod_files, self.del_files = [], [], []
        # ... and two independent source -> destination rename maps.
        self.ren_files, self.ren_dirs = {}, {}
Matt Harbison
|
def __init__(self, ui, repotype, path, revs=None):
    """Initialise a GNU Arch conversion source for the tree at ``path``.

    Raises ``common.NoRepo`` when ``path`` contains no ``{arch}`` entry and
    ``error.Abort`` when neither ``baz`` nor ``tla`` can be located.
    """
    super(gnuarch_source, self).__init__(ui, repotype, path, revs=revs)

    archdir = os.path.join(path, '{arch}')
    if not os.path.exists(archdir):
        raise common.NoRepo(_("%s does not look like a GNU Arch repository")
                            % path)

    # Could use checktool, but we want to check for baz or tla.
    # baz is preferred; tla is only probed when baz is missing.
    self.execmd = None
    if util.findexe('baz'):
        self.execmd = 'baz'
    elif util.findexe('tla'):
        self.execmd = 'tla'
    else:
        raise error.Abort(_('cannot find a GNU Arch tool'))

    common.commandline.__init__(self, ui, self.execmd)

    self.path = os.path.realpath(path)

    # State that is filled in later by the other methods.
    self.tmppath = None
    self.treeversion = None
    self.lastrev = None
    self.changes = {}
    self.parents = {}
    self.tags = {}
    self.archives = []

    self.catlogparser = emailparser.Parser()
    self.encoding = encoding.encoding
Aleix Conchillo Flaque
|
r6035 | |||
def before(self):
    """Collect archive, tree-version and revision data.

    Fills ``self.archives``, ``self.treeversion`` and ``self.tmppath``,
    then scans the revisions of the tree version -- following
    continuation-of headers into other tree versions -- to populate
    ``self.changes`` and ``self.parents``.
    """
    # Get registered archives
    self.archives = [entry.rstrip('\n')
                     for entry in self.runlines0('archives', '-n')]

    # Only tla is invoked without the -d flag in front of the path.
    if self.execmd == 'tla':
        treeargs = ('tree-version', self.path)
    else:
        treeargs = ('tree-version', '-d', self.path)
    self.treeversion = self.run0(*treeargs).strip()

    # Get name of temporary directory
    pieces = self.treeversion.split('/')
    self.tmppath = os.path.join(tempfile.gettempdir(), 'hg-%s' % pieces[1])

    # Generate parents dictionary
    self.parents[None] = []
    pending = self.treeversion
    child = None
    while pending:
        self.ui.status(_('analyzing tree version %s...\n') % pending)

        archive = pending.split('/')[0]
        if archive not in self.archives:
            self.ui.status(_('tree analysis stopped because it points to '
                             'an unregistered archive %s...\n') % archive)
            break

        # Get the complete list of revisions for that tree version
        listing, status = self.runlines('revisions', '-r', '-f', pending)
        self.checkexit(status, 'failed retrieving revisions for %s'
                       % pending)

        # No new iteration unless a revision has a continuation-of header
        pending = None

        for entry in listing:
            rev = entry.strip()
            self.changes[rev] = self.gnuarch_rev(rev)
            self.parents[rev] = []

            # Read author, date and summary; fall back to the archive
            # log when the tree-local cat-log reports a non-zero status.
            catlog, status = self.run('cat-log', '-d', self.path, rev)
            if status:
                catlog = self.run0('cat-archive-log', rev)
            self._parsecatlog(catlog, rev)

            # Populate the parents map
            self.parents[child].append(rev)

            # Keep track of the current revision as the child of the next
            # revision scanned
            child = rev

            # Check if we have to follow the usual incremental history
            # or if we have to 'jump' to a different treeversion given
            # by the continuation-of header.
            origin = self.changes[rev].continuationof
            if origin:
                # Drop the last '--'-separated component of the header.
                pending = '--'.join(origin.split('--')[:-1])
                break

            # If we reached a base-0 revision w/o any continuation-of
            # header, it means the tree history ends here.
            if rev.endswith('base-0'):
                break
Aleix Conchillo Flaque
|
r6035 | |||
def after(self):
    """Delete the directory at ``self.tmppath``, ignoring removal errors."""
    tmpdir = self.tmppath
    self.ui.debug('cleaning up %s\n' % tmpdir)
    shutil.rmtree(tmpdir, ignore_errors=True)
def getheads(self):
    """Return the list stored under the ``None`` key of ``self.parents``."""
    heads = self.parents[None]
    return heads
def getfile(self, name, rev):
    """Return ``(data, mode)`` for ``name`` in the temporary tree.

    ``rev`` must equal ``self.lastrev``; otherwise ``error.Abort`` is
    raised. ``(None, None)`` is returned when ``name`` does not exist
    under ``self.tmppath`` (a dangling symlink still counts as existing).
    """
    if rev != self.lastrev:
        raise error.Abort(_('internal calling inconsistency'))

    target = os.path.join(self.tmppath, name)
    if os.path.lexists(target):
        return self._getfile(name, rev)
    return None, None
Aleix Conchillo Flaque
|
r6035 | |||
Mads Kiilerich
|
def getchanges(self, rev, full):
    """Return ``(changes, copies, set())`` for ``rev``.

    ``changes`` is a sorted, de-duplicated list of ``(path, rev)`` tuples
    covering added, modified, deleted and renamed paths; ``copies`` maps
    each rename destination to its source. ``self.lastrev`` is set to
    ``rev`` on success. A true ``full`` raises ``error.Abort``.
    """
    if full:
        raise error.Abort(_("convert from arch does not support --full"))
    self._update(rev)

    info = self.changes[rev]
    copies = {}

    touched = list(info.add_files)
    touched.extend(info.mod_files)
    touched.extend(info.del_files)

    # A file rename touches both its old and its new name.
    for src, to in info.ren_files.items():
        touched.append(src)
        touched.append(to)
        copies[to] = src

    # A directory rename expands to every file found under the new name.
    for src, to in info.ren_dirs.items():
        chgs, cps = self._rendirchanges(src, to)
        touched.extend(chgs)
        copies.update(cps)

    self.lastrev = rev
    return sorted(set((f, rev) for f in touched)), copies, set()
Aleix Conchillo Flaque
|
r6035 | |||
def getcommit(self, rev):
    """Build a ``common.commit`` from the data recorded for ``rev``."""
    info = self.changes[rev]
    fields = dict(author=info.author,
                  date=info.date,
                  desc=info.summary,
                  parents=self.parents[rev],
                  rev=rev)
    return common.commit(**fields)
Aleix Conchillo Flaque
|
r6035 | |||
def gettags(self):
    """Return the ``self.tags`` mapping."""
    tags = self.tags
    return tags
def _execute(self, cmd, *args, **kwargs):
    """Run ``self.execmd cmd args...`` through the shell.

    Every word is shell-quoted, stdout and stderr are redirected to the
    null device, and the value returned by ``os.system`` is handed back.
    ``kwargs`` is accepted but not used.
    """
    words = [self.execmd, cmd]
    words.extend(args)
    pieces = [util.shellquote(word) for word in words]
    # The redirections are appended after quoting so they stay unquoted.
    pieces.extend(['>', os.devnull, '2>', os.devnull])
    cmdline = util.quotecommand(' '.join(pieces))
    self.ui.debug(cmdline, '\n')
    return os.system(cmdline)
def _update(self, rev):
    """Replay ``rev`` into the temporary tree and record its changes.

    When the replay command reports a non-zero status, the temporary tree
    is removed and the revision is obtained from scratch instead.
    """
    self.ui.debug('applying revision %s...\n' % rev)
    changeset, status = self.runlines('replay', '-d', self.tmppath, rev)
    if not status:
        old_rev = self.parents[rev][0]
        self.ui.debug('computing changeset between %s and %s...\n'
                      % (old_rev, rev))
        self._parsechangeset(changeset, rev)
        return

    # Something went wrong while merging (baz or tla
    # issue?), get latest revision and try from there
    shutil.rmtree(self.tmppath, ignore_errors=True)
    self._obtainrevision(rev)
Aleix Conchillo Flaque
|
r6035 | |||
def _getfile(self, name, rev): | ||||
mode = os.lstat(os.path.join(self.tmppath, name)).st_mode | ||||
if stat.S_ISLNK(mode): | ||||
data = os.readlink(os.path.join(self.tmppath, name)) | ||||
Jordi Gutiérrez Hermoso
|
r24306 | if mode: | ||
mode = 'l' | ||||
else: | ||||
mode = '' | ||||
Aleix Conchillo Flaque
|
r6035 | else: | ||
data = open(os.path.join(self.tmppath, name), 'rb').read() | ||||
Gregory Szorc
|
r25658 | mode = (mode & 0o111) and 'x' or '' | ||
Aleix Conchillo Flaque
|
r6035 | return data, mode | ||
def _exclude(self, name): | ||||
Matt Mackall
|
r10282 | exclude = ['{arch}', '.arch-ids', '.arch-inventory'] | ||
Aleix Conchillo Flaque
|
r6035 | for exc in exclude: | ||
if name.find(exc) != -1: | ||||
return True | ||||
return False | ||||
def _readcontents(self, path): | ||||
files = [] | ||||
contents = os.listdir(path) | ||||
while len(contents) > 0: | ||||
c = contents.pop() | ||||
p = os.path.join(path, c) | ||||
Aleix Conchillo Flaque
|
r6044 | # os.walk could be used, but here we avoid internal GNU | ||
# Arch files and directories, thus saving a lot time. | ||||
Aleix Conchillo Flaque
|
r6035 | if not self._exclude(p): | ||
if os.path.isdir(p): | ||||
contents += [os.path.join(c, f) for f in os.listdir(p)] | ||||
else: | ||||
files.append(c) | ||||
return files | ||||
def _rendirchanges(self, src, dest): | ||||
changes = [] | ||||
copies = {} | ||||
files = self._readcontents(os.path.join(self.tmppath, dest)) | ||||
for f in files: | ||||
s = os.path.join(src, f) | ||||
d = os.path.join(dest, f) | ||||
changes.append(s) | ||||
changes.append(d) | ||||
Patrick Mezard
|
r7567 | copies[d] = s | ||
Aleix Conchillo Flaque
|
r6035 | return changes, copies | ||
Aleix Conchillo Flaque
|
def _obtainrevision(self, rev):
    """Fetch ``rev`` into ``self.tmppath`` and record its files as added.

    The result of the ``get`` command is passed to ``self.checkexit``.
    """
    self.ui.debug('obtaining revision %s...\n' % rev)
    self.checkexit(self._execute('get', rev, self.tmppath))

    self.ui.debug('analyzing revision %s...\n' % rev)
    # Every file present after the fetch is recorded as added.
    present = self._readcontents(self.tmppath)
    self.changes[rev].add_files += present
Aleix Conchillo Flaque
|
r6079 | def _stripbasepath(self, path): | ||
if path.startswith('./'): | ||||
return path[2:] | ||||
return path | ||||
Aleix Conchillo Flaque
|
def _parsecatlog(self, data, rev):
    """Parse a cat-log message and store its fields on ``self.changes[rev]``.

    Sets ``date``, ``author`` and ``summary``, plus ``continuationof``
    when a Continuation-of header is present. Any exception raised while
    doing so is reported as ``error.Abort``.
    """
    try:
        catlog = self.catlogparser.parsestr(data)
        entry = self.changes[rev]

        # Commit date
        parsed = dateutil.strdate(catlog['Standard-date'],
                                  '%Y-%m-%d %H:%M:%S')
        entry.date = dateutil.datestr(parsed)

        # Commit author
        entry.author = self.recode(catlog['Creator'])

        # Commit description: Summary header, blank line, message body
        entry.summary = '\n\n'.join((catlog['Summary'],
                                     catlog.get_payload()))
        entry.summary = self.recode(entry.summary)

        # Commit revision origin when dealing with a branch or tag
        if 'Continuation-of' in catlog:
            entry.continuationof = self.recode(catlog['Continuation-of'])
    except Exception:
        raise error.Abort(_('could not parse cat-log of %s') % rev)
Aleix Conchillo Flaque
|
r6037 | |||
Aleix Conchillo Flaque
|
r6049 | def _parsechangeset(self, data, rev): | ||
Aleix Conchillo Flaque
|
r6035 | for l in data: | ||
l = l.strip() | ||||
Aleix Conchillo Flaque
|
r6055 | # Added file (ignore added directory) | ||
Aleix Conchillo Flaque
|
r6035 | if l.startswith('A') and not l.startswith('A/'): | ||
Aleix Conchillo Flaque
|
r6079 | file = self._stripbasepath(l[1:].strip()) | ||
Aleix Conchillo Flaque
|
r6035 | if not self._exclude(file): | ||
self.changes[rev].add_files.append(file) | ||||
Aleix Conchillo Flaque
|
r6055 | # Deleted file (ignore deleted directory) | ||
elif l.startswith('D') and not l.startswith('D/'): | ||||
Aleix Conchillo Flaque
|
r6079 | file = self._stripbasepath(l[1:].strip()) | ||
Aleix Conchillo Flaque
|
r6055 | if not self._exclude(file): | ||
self.changes[rev].del_files.append(file) | ||||
# Modified binary file | ||||
elif l.startswith('Mb'): | ||||
Aleix Conchillo Flaque
|
r6079 | file = self._stripbasepath(l[2:].strip()) | ||
Aleix Conchillo Flaque
|
r6055 | if not self._exclude(file): | ||
self.changes[rev].mod_files.append(file) | ||||
# Modified link | ||||
elif l.startswith('M->'): | ||||
Aleix Conchillo Flaque
|
r6079 | file = self._stripbasepath(l[3:].strip()) | ||
Aleix Conchillo Flaque
|
r6055 | if not self._exclude(file): | ||
self.changes[rev].mod_files.append(file) | ||||
# Modified file | ||||
elif l.startswith('M'): | ||||
Aleix Conchillo Flaque
|
r6079 | file = self._stripbasepath(l[1:].strip()) | ||
Aleix Conchillo Flaque
|
r6055 | if not self._exclude(file): | ||
self.changes[rev].mod_files.append(file) | ||||
# Renamed file (or link) | ||||
elif l.startswith('=>'): | ||||
files = l[2:].strip().split(' ') | ||||
if len(files) == 1: | ||||
files = l[2:].strip().split('\t') | ||||
Aleix Conchillo Flaque
|
r6079 | src = self._stripbasepath(files[0]) | ||
dst = self._stripbasepath(files[1]) | ||||
if not self._exclude(src) and not self._exclude(dst): | ||||
self.changes[rev].ren_files[src] = dst | ||||
Aleix Conchillo Flaque
|
r6055 | # Conversion from file to link or from link to file (modified) | ||
elif l.startswith('ch'): | ||||
Aleix Conchillo Flaque
|
r6079 | file = self._stripbasepath(l[2:].strip()) | ||
Aleix Conchillo Flaque
|
r6055 | if not self._exclude(file): | ||
self.changes[rev].mod_files.append(file) | ||||
# Renamed directory | ||||
Aleix Conchillo Flaque
|
r6035 | elif l.startswith('/>'): | ||
dirs = l[2:].strip().split(' ') | ||||
if len(dirs) == 1: | ||||
dirs = l[2:].strip().split('\t') | ||||
Aleix Conchillo Flaque
|
r6079 | src = self._stripbasepath(dirs[0]) | ||
dst = self._stripbasepath(dirs[1]) | ||||
if not self._exclude(src) and not self._exclude(dst): | ||||
self.changes[rev].ren_dirs[src] = dst | ||||