subversion.py
1740 lines
| 60.8 KiB
| text/x-python
|
PythonLexer
Daniel Holth
|
r4765 | # Subversion 1.4/1.5 Python API backend | ||
# | ||||
# Copyright(C) 2007 Daniel Holth et al | ||||
Manuel Jacob
|
r45561 | import codecs | ||
import locale | ||||
timeless
|
r28408 | import os | ||
Gregory Szorc
|
r49725 | import pickle | ||
timeless
|
r28408 | import re | ||
Augie Fackler
|
r19787 | import xml.dom.minidom | ||
Bryan O'Sullivan
|
r5513 | |||
Yuya Nishihara
|
r29205 | from mercurial.i18n import _ | ||
Gregory Szorc
|
r43355 | from mercurial.pycompat import open | ||
timeless
|
r28408 | from mercurial import ( | ||
encoding, | ||||
error, | ||||
Pulkit Goyal
|
r30519 | pycompat, | ||
timeless
|
r28408 | util, | ||
Pierre-Yves David
|
r31246 | vfs as vfsmod, | ||
timeless
|
r28408 | ) | ||
Yuya Nishihara
|
r37102 | from mercurial.utils import ( | ||
dateutil, | ||||
Yuya Nishihara
|
r37138 | procutil, | ||
Yuya Nishihara
|
r37102 | stringutil, | ||
) | ||||
Daniel Holth
|
r4765 | |||
timeless
|
r28408 | from . import common | ||
timeless
|
r28861 | stringio = util.stringio | ||
Patrick Mezard
|
r16511 | propertycache = util.propertycache | ||
timeless
|
r28883 | urlerr = util.urlerr | ||
urlreq = util.urlreq | ||||
Patrick Mezard
|
r16511 | |||
timeless
|
r28408 | commandline = common.commandline | ||
commit = common.commit | ||||
converter_sink = common.converter_sink | ||||
converter_source = common.converter_source | ||||
decodeargs = common.decodeargs | ||||
encodeargs = common.encodeargs | ||||
makedatetimestamp = common.makedatetimestamp | ||||
mapfile = common.mapfile | ||||
MissingTool = common.MissingTool | ||||
NoRepo = common.NoRepo | ||||
Daniel Holth
|
r4765 | # Subversion stuff. Works best with very recent Python SVN bindings | ||
# e.g. SVN 1.5 or backports. Thanks to the bzr folks for enhancing | ||||
# these bindings. | ||||
Brendan Cully
|
r4766 | try: | ||
Brendan Cully
|
r5010 | import svn | ||
import svn.client | ||||
Brendan Cully
|
r4766 | import svn.core | ||
import svn.ra | ||||
import svn.delta | ||||
FUJIWARA Katsunori
|
r28459 | from . import transport | ||
Ronny Pfannschmidt
|
r8221 | import warnings | ||
Augie Fackler
|
r43346 | |||
warnings.filterwarnings( | ||||
Manuel Jacob
|
r45490 | 'ignore', module='svn.core', category=DeprecationWarning | ||
Augie Fackler
|
r43346 | ) | ||
svn.core.SubversionException # trigger import to catch error | ||||
Ronny Pfannschmidt
|
r8221 | |||
Brendan Cully
|
r4766 | except ImportError: | ||
Azhagu Selvan SP
|
r13480 | svn = None | ||
Daniel Holth
|
r4765 | |||
Augie Fackler
|
r43346 | |||
Manuel Jacob
|
r45562 | # In Subversion, paths and URLs are Unicode (encoded as UTF-8), which | ||
# Subversion converts from / to native strings when interfacing with the OS. | ||||
# When passing paths and URLs to Subversion, we have to recode them such that | ||||
# it roundstrips with what Subversion is doing. | ||||
Manuel Jacob
|
r45561 | |||
fsencoding = None | ||||
def init_fsencoding(): | ||||
global fsencoding, fsencoding_is_utf8 | ||||
if fsencoding is not None: | ||||
return | ||||
if pycompat.iswindows: | ||||
# On Windows, filenames are Unicode, but we store them using the MBCS | ||||
# encoding. | ||||
fsencoding = 'mbcs' | ||||
else: | ||||
# This is the encoding used to convert UTF-8 back to natively-encoded | ||||
# strings in Subversion 1.14.0 or earlier with APR 1.7.0 or earlier. | ||||
with util.with_lc_ctype(): | ||||
fsencoding = locale.nl_langinfo(locale.CODESET) or 'ISO-8859-1' | ||||
fsencoding = codecs.lookup(fsencoding).name | ||||
fsencoding_is_utf8 = fsencoding == codecs.lookup('utf-8').name | ||||
def fs2svn(s): | ||||
if fsencoding_is_utf8: | ||||
return s | ||||
else: | ||||
return s.decode(fsencoding).encode('utf-8') | ||||
Nikita Slyusarev
|
r47129 | def formatsvndate(date): | ||
return dateutil.datestr(date, b'%Y-%m-%dT%H:%M:%S.000000Z') | ||||
def parsesvndate(s): | ||||
# Example SVN datetime. Includes microseconds. | ||||
# ISO-8601 conformant | ||||
# '2007-01-04T17:35:00.902377Z' | ||||
return dateutil.parsedate(s[:19] + b' UTC', [b'%Y-%m-%dT%H:%M:%S']) | ||||
Patrick Mezard
|
r7381 | class SvnPathNotFound(Exception): | ||
pass | ||||
Augie Fackler
|
r43346 | |||
Patrick Mezard
|
r13690 | def revsplit(rev): | ||
Mads Kiilerich
|
r20419 | """Parse a revision string and return (uuid, path, revnum). | ||
Yuya Nishihara
|
r34133 | >>> revsplit(b'svn:a2147622-4a9f-4db4-a8d3-13562ff547b2' | ||
... b'/proj%20B/mytrunk/mytrunk@1') | ||||
Mads Kiilerich
|
r20419 | ('a2147622-4a9f-4db4-a8d3-13562ff547b2', '/proj%20B/mytrunk/mytrunk', 1) | ||
Yuya Nishihara
|
r34133 | >>> revsplit(b'svn:8af66a51-67f5-4354-b62c-98d67cc7be1d@1') | ||
Mads Kiilerich
|
r20419 | ('', '', 1) | ||
Yuya Nishihara
|
r34133 | >>> revsplit(b'@7') | ||
Mads Kiilerich
|
r20419 | ('', '', 7) | ||
Yuya Nishihara
|
r34133 | >>> revsplit(b'7') | ||
Mads Kiilerich
|
r20419 | ('', '', 0) | ||
Yuya Nishihara
|
r34133 | >>> revsplit(b'bad') | ||
Mads Kiilerich
|
r20419 | ('', '', 0) | ||
""" | ||||
Augie Fackler
|
r43347 | parts = rev.rsplit(b'@', 1) | ||
Mads Kiilerich
|
r20419 | revnum = 0 | ||
if len(parts) > 1: | ||||
revnum = int(parts[1]) | ||||
Augie Fackler
|
r43347 | parts = parts[0].split(b'/', 1) | ||
uuid = b'' | ||||
mod = b'' | ||||
if len(parts) > 1 and parts[0].startswith(b'svn:'): | ||||
Mads Kiilerich
|
r20419 | uuid = parts[0][4:] | ||
Augie Fackler
|
r43347 | mod = b'/' + parts[1] | ||
Mads Kiilerich
|
r20419 | return uuid, mod, revnum | ||
Patrick Mezard
|
r13690 | |||
Augie Fackler
|
r43346 | |||
Patrick Mezard
|
r15599 | def quote(s): | ||
# As of svn 1.7, many svn calls expect "canonical" paths. In | ||||
# theory, we should call svn.core.*canonicalize() on all paths | ||||
# before passing them to the API. Instead, we assume the base url | ||||
# is canonical and copy the behaviour of svn URL encoding function | ||||
# so we can extend it safely with new components. The "safe" | ||||
# characters were taken from the "svn_uri__char_validity" table in | ||||
# libsvn_subr/path.c. | ||||
Augie Fackler
|
r43347 | return urlreq.quote(s, b"!$&'()*+,-./:=@_~") | ||
Patrick Mezard
|
r15599 | |||
Augie Fackler
|
r43346 | |||
Brendan Cully
|
r5008 | def geturl(path): | ||
Manuel Jacob
|
r45565 | """Convert path or URL to a SVN URL, encoded in UTF-8. | ||
This can raise UnicodeDecodeError if the path or URL can't be converted to | ||||
unicode using `fsencoding`. | ||||
""" | ||||
Brendan Cully
|
r5010 | try: | ||
Manuel Jacob
|
r45562 | return svn.client.url_from_path( | ||
svn.core.svn_path_canonicalize(fs2svn(path)) | ||||
) | ||||
FUJIWARA Katsunori
|
r28460 | except svn.core.SubversionException: | ||
Patrick Mezard
|
r15599 | # svn.client.url_from_path() fails with local repositories | ||
Brendan Cully
|
r5010 | pass | ||
Brendan Cully
|
r5008 | if os.path.isdir(path): | ||
r48434 | path = os.path.normpath(util.abspath(path)) | |||
Jun Wu
|
r34646 | if pycompat.iswindows: | ||
Augie Fackler
|
r43347 | path = b'/' + util.normpath(path) | ||
Patrick Mezard
|
r8886 | # Module URL is later compared with the repository URL returned | ||
# by svn API, which is UTF-8. | ||||
Manuel Jacob
|
r45561 | path = fs2svn(path) | ||
Augie Fackler
|
r43347 | path = b'file://%s' % quote(path) | ||
Patrick Mezard
|
r15599 | return svn.core.svn_path_canonicalize(path) | ||
Brendan Cully
|
r5008 | |||
Augie Fackler
|
r43346 | |||
Brendan Cully
|
r5117 | def optrev(number): | ||
optrev = svn.core.svn_opt_revision_t() | ||||
optrev.kind = svn.core.svn_opt_revision_number | ||||
optrev.value.number = number | ||||
return optrev | ||||
Augie Fackler
|
r43346 | |||
Bryan O'Sullivan
|
r4946 | class changedpath(object): | ||
def __init__(self, p): | ||||
self.copyfrom_path = p.copyfrom_path | ||||
self.copyfrom_rev = p.copyfrom_rev | ||||
self.action = p.action | ||||
Augie Fackler
|
r43346 | |||
def get_log_child( | ||||
fp, | ||||
url, | ||||
paths, | ||||
start, | ||||
end, | ||||
limit=0, | ||||
discover_changed_paths=True, | ||||
strict_node_history=False, | ||||
): | ||||
Patrick Mezard
|
r5127 | protocol = -1 | ||
Augie Fackler
|
r43346 | |||
Patrick Mezard
|
r5127 | def receiver(orig_paths, revnum, author, date, message, pool): | ||
Mads Kiilerich
|
r20057 | paths = {} | ||
Patrick Mezard
|
r5127 | if orig_paths is not None: | ||
Gregory Szorc
|
r49768 | for k, v in orig_paths.items(): | ||
Mads Kiilerich
|
r20057 | paths[k] = changedpath(v) | ||
Augie Fackler
|
r43346 | pickle.dump((paths, revnum, author, date, message), fp, protocol) | ||
Thomas Arendsen Hein
|
r5143 | |||
Patrick Mezard
|
r5127 | try: | ||
# Use an ra of our own so that our parent can consume | ||||
# our results without confusing the server. | ||||
t = transport.SvnRaTransport(url=url) | ||||
Augie Fackler
|
r43346 | svn.ra.get_log( | ||
t.ra, | ||||
paths, | ||||
start, | ||||
end, | ||||
limit, | ||||
discover_changed_paths, | ||||
strict_node_history, | ||||
receiver, | ||||
) | ||||
Patrick Mezard
|
r5873 | except IOError: | ||
# Caller may interrupt the iteration | ||||
pickle.dump(None, fp, protocol) | ||||
Gregory Szorc
|
r25660 | except Exception as inst: | ||
Yuya Nishihara
|
r37102 | pickle.dump(stringutil.forcebytestr(inst), fp, protocol) | ||
Patrick Mezard
|
r5127 | else: | ||
pickle.dump(None, fp, protocol) | ||||
Sascha Nemecek
|
r36529 | fp.flush() | ||
Patrick Mezard
|
r6397 | # With large history, cleanup process goes crazy and suddenly | ||
# consumes *huge* amount of memory. The output file being closed, | ||||
# there is no need for clean termination. | ||||
os._exit(0) | ||||
Patrick Mezard
|
r5127 | |||
Augie Fackler
|
r43346 | |||
Thomas Arendsen Hein
|
r5139 | def debugsvnlog(ui, **opts): | ||
"""Fetch SVN log in a subprocess and channel them back to parent to | ||||
avoid memory collection issues. | ||||
""" | ||||
Manuel Jacob
|
r45551 | with util.with_lc_ctype(): | ||
if svn is None: | ||||
raise error.Abort( | ||||
_(b'debugsvnlog could not load Subversion python bindings') | ||||
) | ||||
Mads Kiilerich
|
r17053 | |||
Manuel Jacob
|
r45551 | args = decodeargs(ui.fin.read()) | ||
get_log_child(ui.fout, *args) | ||||
Thomas Arendsen Hein
|
r5139 | |||
Augie Fackler
|
r43346 | |||
Benoit Boissinot
|
r8778 | class logstream(object): | ||
Patrick Mezard
|
r5873 | """Interruptible revision log iterator.""" | ||
Augie Fackler
|
r43346 | |||
Patrick Mezard
|
r5873 | def __init__(self, stdout): | ||
self._stdout = stdout | ||||
def __iter__(self): | ||||
while True: | ||||
Patrick Mezard
|
r9587 | try: | ||
entry = pickle.load(self._stdout) | ||||
except EOFError: | ||||
Augie Fackler
|
r43346 | raise error.Abort( | ||
_( | ||||
Augie Fackler
|
r43347 | b'Mercurial failed to run itself, check' | ||
b' hg executable is in PATH' | ||||
Augie Fackler
|
r43346 | ) | ||
) | ||||
Patrick Mezard
|
r5873 | try: | ||
orig_paths, revnum, author, date, message = entry | ||||
Brodie Rao
|
r16688 | except (TypeError, ValueError): | ||
Patrick Mezard
|
r5873 | if entry is None: | ||
break | ||||
Augie Fackler
|
r43347 | raise error.Abort(_(b"log stream exception '%s'") % entry) | ||
Patrick Mezard
|
r5873 | yield entry | ||
def close(self): | ||||
if self._stdout: | ||||
self._stdout.close() | ||||
self._stdout = None | ||||
Augie Fackler
|
r43346 | |||
Mads Kiilerich
|
r20420 | class directlogstream(list): | ||
"""Direct revision log iterator. | ||||
This can be used for debugging and development but it will probably leak | ||||
memory and is not suitable for real conversions.""" | ||||
Augie Fackler
|
r43346 | def __init__( | ||
self, | ||||
url, | ||||
paths, | ||||
start, | ||||
end, | ||||
limit=0, | ||||
discover_changed_paths=True, | ||||
strict_node_history=False, | ||||
): | ||||
Mads Kiilerich
|
r20420 | def receiver(orig_paths, revnum, author, date, message, pool): | ||
paths = {} | ||||
if orig_paths is not None: | ||||
Gregory Szorc
|
r49768 | for k, v in orig_paths.items(): | ||
Mads Kiilerich
|
r20420 | paths[k] = changedpath(v) | ||
self.append((paths, revnum, author, date, message)) | ||||
# Use an ra of our own so that our parent can consume | ||||
# our results without confusing the server. | ||||
t = transport.SvnRaTransport(url=url) | ||||
Augie Fackler
|
r43346 | svn.ra.get_log( | ||
t.ra, | ||||
paths, | ||||
start, | ||||
end, | ||||
limit, | ||||
discover_changed_paths, | ||||
strict_node_history, | ||||
receiver, | ||||
) | ||||
Mads Kiilerich
|
r20420 | |||
def close(self): | ||||
pass | ||||
Augie Fackler
|
r8074 | |||
Augie Fackler
|
r43346 | |||
Augie Fackler
|
r8074 | # Check to see if the given path is a local Subversion repo. Verify this by | ||
# looking for several svn-specific files and directories in the given | ||||
# directory. | ||||
Patrick Mezard
|
r9829 | def filecheck(ui, path, proto): | ||
Augie Fackler
|
r43347 | for x in (b'locks', b'hooks', b'format', b'db'): | ||
Augie Fackler
|
r8074 | if not os.path.exists(os.path.join(path, x)): | ||
return False | ||||
return True | ||||
Augie Fackler
|
r43346 | |||
Augie Fackler
|
r8074 | # Check to see if a given path is the root of an svn repo over http. We verify | ||
# this by requesting a version-controlled URL we know can't exist and looking | ||||
# for the svn-specific "not found" XML. | ||||
Patrick Mezard
|
r9829 | def httpcheck(ui, path, proto): | ||
try: | ||||
timeless
|
r28883 | opener = urlreq.buildopener() | ||
Manuel Jacob
|
r45560 | rsp = opener.open( | ||
pycompat.strurl(b'%s://%s/!svn/ver/0/.svn' % (proto, path)), b'rb' | ||||
) | ||||
Matt Mackall
|
r10282 | data = rsp.read() | ||
timeless
|
r28883 | except urlerr.httperror as inst: | ||
Patrick Mezard
|
r9838 | if inst.code != 404: | ||
# Except for 404 we cannot know for sure this is not an svn repo | ||||
Augie Fackler
|
r43346 | ui.warn( | ||
_( | ||||
Augie Fackler
|
r43347 | b'svn: cannot probe remote repository, assume it could ' | ||
b'be a subversion repository. Use --source-type if you ' | ||||
b'know better.\n' | ||||
Augie Fackler
|
r43346 | ) | ||
) | ||||
Patrick Mezard
|
r9838 | return True | ||
data = inst.fp.read() | ||||
Brodie Rao
|
r16689 | except Exception: | ||
timeless
|
r28883 | # Could be urlerr.urlerror if the URL is invalid or anything else. | ||
Patrick Mezard
|
r9829 | return False | ||
Augie Fackler
|
r43347 | return b'<m:human-readable errcode="160013">' in data | ||
Augie Fackler
|
r8074 | |||
Augie Fackler
|
r43346 | |||
protomap = { | ||||
Augie Fackler
|
r43347 | b'http': httpcheck, | ||
b'https': httpcheck, | ||||
b'file': filecheck, | ||||
Augie Fackler
|
r43346 | } | ||
Manuel Jacob
|
r45566 | class NonUtf8PercentEncodedBytes(Exception): | ||
pass | ||||
# Subversion paths are Unicode. Since the percent-decoding is done on | ||||
# UTF-8-encoded strings, percent-encoded bytes are interpreted as UTF-8. | ||||
def url2pathname_like_subversion(unicodepath): | ||||
if pycompat.ispy3: | ||||
# On Python 3, we have to pass unicode to urlreq.url2pathname(). | ||||
# Percent-decoded bytes get decoded using UTF-8 and the 'replace' error | ||||
# handler. | ||||
unicodepath = urlreq.url2pathname(unicodepath) | ||||
if u'\N{REPLACEMENT CHARACTER}' in unicodepath: | ||||
raise NonUtf8PercentEncodedBytes | ||||
else: | ||||
return unicodepath | ||||
else: | ||||
# If we passed unicode on Python 2, it would be converted using the | ||||
# latin-1 encoding. Therefore, we pass UTF-8-encoded bytes. | ||||
unicodepath = urlreq.url2pathname(unicodepath.encode('utf-8')) | ||||
try: | ||||
return unicodepath.decode('utf-8') | ||||
except UnicodeDecodeError: | ||||
raise NonUtf8PercentEncodedBytes | ||||
Patrick Mezard
|
r9829 | def issvnurl(ui, url): | ||
Edouard Gomez
|
r8764 | try: | ||
Augie Fackler
|
r43347 | proto, path = url.split(b'://', 1) | ||
if proto == b'file': | ||||
Augie Fackler
|
r43346 | if ( | ||
pycompat.iswindows | ||||
Augie Fackler
|
r43347 | and path[:1] == b'/' | ||
Augie Fackler
|
r43346 | and path[1:2].isalpha() | ||
Augie Fackler
|
r43347 | and path[2:6].lower() == b'%3a/' | ||
Augie Fackler
|
r43346 | ): | ||
Augie Fackler
|
r43347 | path = path[:2] + b':/' + path[6:] | ||
Manuel Jacob
|
r45562 | try: | ||
Manuel Jacob
|
r45566 | unicodepath = path.decode(fsencoding) | ||
Manuel Jacob
|
r45562 | except UnicodeDecodeError: | ||
ui.warn( | ||||
_( | ||||
b'Subversion requires that file URLs can be converted ' | ||||
b'to Unicode using the current locale encoding (%s)\n' | ||||
) | ||||
% pycompat.sysbytes(fsencoding) | ||||
) | ||||
return False | ||||
Manuel Jacob
|
r45566 | try: | ||
unicodepath = url2pathname_like_subversion(unicodepath) | ||||
except NonUtf8PercentEncodedBytes: | ||||
Manuel Jacob
|
r45495 | ui.warn( | ||
_( | ||||
Manuel Jacob
|
r45566 | b'Subversion does not support non-UTF-8 ' | ||
b'percent-encoded bytes in file URLs\n' | ||||
Manuel Jacob
|
r45495 | ) | ||
) | ||||
Manuel Jacob
|
r45566 | return False | ||
# Below, we approximate how Subversion checks the path. On Unix, we | ||||
# should therefore convert the path to bytes using `fsencoding` | ||||
# (like Subversion does). On Windows, the right thing would | ||||
# actually be to leave the path as unicode. For now, we restrict | ||||
# the path to MBCS. | ||||
path = unicodepath.encode(fsencoding) | ||||
Edouard Gomez
|
r8764 | except ValueError: | ||
Augie Fackler
|
r43347 | proto = b'file' | ||
r48434 | path = util.abspath(url) | |||
Manuel Jacob
|
r45561 | try: | ||
path.decode(fsencoding) | ||||
except UnicodeDecodeError: | ||||
ui.warn( | ||||
_( | ||||
b'Subversion requires that paths can be converted to ' | ||||
b'Unicode using the current locale encoding (%s)\n' | ||||
) | ||||
% pycompat.sysbytes(fsencoding) | ||||
) | ||||
return False | ||||
Augie Fackler
|
r43347 | if proto == b'file': | ||
FUJIWARA Katsunori
|
r16067 | path = util.pconvert(path) | ||
Manuel Jacob
|
r45559 | elif proto in (b'http', 'https'): | ||
if not encoding.isasciistr(path): | ||||
ui.warn( | ||||
_( | ||||
b"Subversion sources don't support non-ASCII characters in " | ||||
b"HTTP(S) URLs. Please percent-encode them.\n" | ||||
) | ||||
) | ||||
return False | ||||
Patrick Mezard
|
r10885 | check = protomap.get(proto, lambda *args: False) | ||
Augie Fackler
|
r43347 | while b'/' in path: | ||
Patrick Mezard
|
r9829 | if check(ui, path, proto): | ||
Augie Fackler
|
r8074 | return True | ||
Augie Fackler
|
r43347 | path = path.rsplit(b'/', 1)[0] | ||
Augie Fackler
|
r8074 | return False | ||
Augie Fackler
|
r43346 | |||
Daniel Holth
|
r4765 | # SVN conversion code stolen from bzr-svn and tailor | ||
Patrick Mezard
|
r5876 | # | ||
# Subversion looks like a versioned filesystem, branches structures | ||||
# are defined by conventions and not enforced by the tool. First, | ||||
# we define the potential branches (modules) as "trunk" and "branches" | ||||
# children directories. Revisions are then identified by their | ||||
# module and revision number (and a repository identifier). | ||||
# | ||||
# The revision graph is really a tree (or a forest). By default, a | ||||
# revision parent is the previous revision in the same module. If the | ||||
# module directory is copied/moved from another module then the | ||||
# revision is the module root and its parent the source revision in | ||||
# the parent module. A revision has at most one parent. | ||||
# | ||||
Bryan O'Sullivan
|
r5438 | class svn_source(converter_source): | ||
Matt Harbison
|
r35168 | def __init__(self, ui, repotype, url, revs=None): | ||
super(svn_source, self).__init__(ui, repotype, url, revs=revs) | ||||
Brendan Cully
|
r4807 | |||
Manuel Jacob
|
r45561 | init_fsencoding() | ||
Augie Fackler
|
r43346 | if not ( | ||
Augie Fackler
|
r43347 | url.startswith(b'svn://') | ||
or url.startswith(b'svn+ssh://') | ||||
Augie Fackler
|
r43346 | or ( | ||
os.path.exists(url) | ||||
Augie Fackler
|
r43347 | and os.path.exists(os.path.join(url, b'.svn')) | ||
Augie Fackler
|
r43346 | ) | ||
or issvnurl(ui, url) | ||||
): | ||||
raise NoRepo( | ||||
Augie Fackler
|
r43347 | _(b"%s does not look like a Subversion repository") % url | ||
Augie Fackler
|
r43346 | ) | ||
Azhagu Selvan SP
|
r13480 | if svn is None: | ||
Augie Fackler
|
r43347 | raise MissingTool(_(b'could not load Subversion python bindings')) | ||
Patrick Mezard
|
r7447 | |||
try: | ||||
version = svn.core.SVN_VER_MAJOR, svn.core.SVN_VER_MINOR | ||||
if version < (1, 4): | ||||
Augie Fackler
|
r43346 | raise MissingTool( | ||
_( | ||||
Augie Fackler
|
r43347 | b'Subversion python bindings %d.%d found, ' | ||
b'1.4 or later required' | ||||
Augie Fackler
|
r43346 | ) | ||
% version | ||||
) | ||||
Patrick Mezard
|
r7447 | except AttributeError: | ||
Augie Fackler
|
r43346 | raise MissingTool( | ||
_( | ||||
Augie Fackler
|
r43347 | b'Subversion python bindings are too old, 1.4 ' | ||
b'or later required' | ||||
Augie Fackler
|
r43346 | ) | ||
) | ||||
Brendan Cully
|
r4766 | |||
Brendan Cully
|
r4813 | self.lastrevs = {} | ||
Brendan Cully
|
r4766 | latest = None | ||
Daniel Holth
|
r4765 | try: | ||
# Support file://path@rev syntax. Useful e.g. to convert | ||||
# deleted branches. | ||||
Augie Fackler
|
r43347 | at = url.rfind(b'@') | ||
Bryan O'Sullivan
|
r4927 | if at >= 0: | ||
Augie Fackler
|
r43346 | latest = int(url[at + 1 :]) | ||
Bryan O'Sullivan
|
r4927 | url = url[:at] | ||
Peter Arrenbrecht
|
r7874 | except ValueError: | ||
Brendan Cully
|
r4766 | pass | ||
Brendan Cully
|
r5008 | self.url = geturl(url) | ||
Augie Fackler
|
r43347 | self.encoding = b'UTF-8' # Subversion is always nominal UTF-8 | ||
Daniel Holth
|
r4765 | try: | ||
Manuel Jacob
|
r45551 | with util.with_lc_ctype(): | ||
self.transport = transport.SvnRaTransport(url=self.url) | ||||
self.ra = self.transport.ra | ||||
self.ctx = self.transport.client | ||||
self.baseurl = svn.ra.get_repos_root(self.ra) | ||||
# Module is either empty or a repository path starting with | ||||
# a slash and not ending with a slash. | ||||
self.module = urlreq.unquote(self.url[len(self.baseurl) :]) | ||||
self.prevmodule = None | ||||
self.rootmodule = self.module | ||||
self.commits = {} | ||||
self.paths = {} | ||||
self.uuid = svn.ra.get_uuid(self.ra) | ||||
FUJIWARA Katsunori
|
r28460 | except svn.core.SubversionException: | ||
Matt Mackall
|
r8206 | ui.traceback() | ||
Augie Fackler
|
r43347 | svnversion = b'%d.%d.%d' % ( | ||
Augie Fackler
|
r43346 | svn.core.SVN_VER_MAJOR, | ||
svn.core.SVN_VER_MINOR, | ||||
svn.core.SVN_VER_MICRO, | ||||
) | ||||
raise NoRepo( | ||||
_( | ||||
Augie Fackler
|
r43347 | b"%s does not look like a Subversion repository " | ||
b"to libsvn version %s" | ||||
Augie Fackler
|
r43346 | ) | ||
% (self.url, svnversion) | ||||
) | ||||
Daniel Holth
|
r4765 | |||
Durham Goode
|
r25748 | if revs: | ||
if len(revs) > 1: | ||||
Augie Fackler
|
r43346 | raise error.Abort( | ||
_( | ||||
Augie Fackler
|
r43347 | b'subversion source does not support ' | ||
b'specifying multiple revisions' | ||||
Augie Fackler
|
r43346 | ) | ||
) | ||||
Thomas Arendsen Hein
|
r5145 | try: | ||
Durham Goode
|
r25748 | latest = int(revs[0]) | ||
Thomas Arendsen Hein
|
r5145 | except ValueError: | ||
Augie Fackler
|
r43346 | raise error.Abort( | ||
Augie Fackler
|
r43347 | _(b'svn: revision %s is not an integer') % revs[0] | ||
Augie Fackler
|
r43346 | ) | ||
Thomas Arendsen Hein
|
r5145 | |||
Augie Fackler
|
r43347 | trunkcfg = self.ui.config(b'convert', b'svn.trunk') | ||
Augie Fackler
|
r34891 | if trunkcfg is None: | ||
Augie Fackler
|
r43347 | trunkcfg = b'trunk' | ||
self.trunkname = trunkcfg.strip(b'/') | ||||
self.startrev = self.ui.config(b'convert', b'svn.startrev') | ||||
Patrick Mezard
|
r6173 | try: | ||
self.startrev = int(self.startrev) | ||||
if self.startrev < 0: | ||||
self.startrev = 0 | ||||
except ValueError: | ||||
Augie Fackler
|
r43346 | raise error.Abort( | ||
Augie Fackler
|
r43347 | _(b'svn: start revision %s is not an integer') % self.startrev | ||
Augie Fackler
|
r43346 | ) | ||
Patrick Mezard
|
r6173 | |||
Mads Kiilerich
|
r14152 | try: | ||
Manuel Jacob
|
r45551 | with util.with_lc_ctype(): | ||
self.head = self.latest(self.module, latest) | ||||
Mads Kiilerich
|
r14152 | except SvnPathNotFound: | ||
self.head = None | ||||
Patrick Mezard
|
r5957 | if not self.head: | ||
Augie Fackler
|
r43347 | raise error.Abort( | ||
_(b'no revision found in module %s') % self.module | ||||
) | ||||
Patrick Mezard
|
r5955 | self.last_changed = self.revnum(self.head) | ||
Thomas Arendsen Hein
|
r6210 | |||
Mads Kiilerich
|
r22298 | self._changescache = (None, None) | ||
Daniel Holth
|
r4765 | |||
Augie Fackler
|
r43347 | if os.path.exists(os.path.join(url, b'.svn/entries')): | ||
Bryan O'Sullivan
|
r5554 | self.wc = url | ||
else: | ||||
self.wc = None | ||||
self.convertfp = None | ||||
Manuel Jacob
|
r45551 | def before(self): | ||
self.with_lc_ctype = util.with_lc_ctype() | ||||
self.with_lc_ctype.__enter__() | ||||
def after(self): | ||||
self.with_lc_ctype.__exit__(None, None, None) | ||||
Bryan O'Sullivan
|
r5510 | def setrevmap(self, revmap): | ||
Brendan Cully
|
r4840 | lastrevs = {} | ||
Augie Fackler
|
r36313 | for revid in revmap: | ||
Patrick Mezard
|
r13690 | uuid, module, revnum = revsplit(revid) | ||
Brendan Cully
|
r4840 | lastrevnum = lastrevs.setdefault(module, revnum) | ||
if revnum > lastrevnum: | ||||
lastrevs[module] = revnum | ||||
self.lastrevs = lastrevs | ||||
Bryan O'Sullivan
|
r4925 | def exists(self, path, optrev): | ||
try: | ||||
Augie Fackler
|
r43346 | svn.client.ls( | ||
Augie Fackler
|
r43347 | self.url.rstrip(b'/') + b'/' + quote(path), | ||
Augie Fackler
|
r43346 | optrev, | ||
False, | ||||
self.ctx, | ||||
) | ||||
Kirill Smelkov
|
r5461 | return True | ||
FUJIWARA Katsunori
|
r28460 | except svn.core.SubversionException: | ||
Kirill Smelkov
|
r5461 | return False | ||
Bryan O'Sullivan
|
r4925 | |||
Brendan Cully
|
r4840 | def getheads(self): | ||
Patrick Mezard
|
r6491 | def isdir(path, revnum): | ||
Patrick Mezard
|
r6848 | kind = self._checkpath(path, revnum) | ||
Patrick Mezard
|
r6491 | return kind == svn.core.svn_node_dir | ||
Edouard Gomez
|
r5854 | def getcfgpath(name, rev): | ||
Augie Fackler
|
r43347 | cfgpath = self.ui.config(b'convert', b'svn.' + name) | ||
if cfgpath is not None and cfgpath.strip() == b'': | ||||
Patrick Mezard
|
r6172 | return None | ||
Augie Fackler
|
r43347 | path = (cfgpath or name).strip(b'/') | ||
Edouard Gomez
|
r5854 | if not self.exists(path, rev): | ||
Augie Fackler
|
r43347 | if self.module.endswith(path) and name == b'trunk': | ||
Pavel Boldin
|
r13494 | # we are converting from inside this directory | ||
return None | ||||
Edouard Gomez
|
r5854 | if cfgpath: | ||
Augie Fackler
|
r43346 | raise error.Abort( | ||
Augie Fackler
|
r43347 | _(b'expected %s to be at %r, but not found') | ||
Augie Fackler
|
r43346 | % (name, path) | ||
) | ||||
Edouard Gomez
|
r5854 | return None | ||
Manuel Jacob
|
r45497 | self.ui.note( | ||
_(b'found %s at %r\n') % (name, pycompat.bytestr(path)) | ||||
) | ||||
Edouard Gomez
|
r5854 | return path | ||
Brendan Cully
|
r5117 | rev = optrev(self.last_changed) | ||
Augie Fackler
|
r43347 | oldmodule = b'' | ||
trunk = getcfgpath(b'trunk', rev) | ||||
self.tags = getcfgpath(b'tags', rev) | ||||
branches = getcfgpath(b'branches', rev) | ||||
Edouard Gomez
|
r5854 | |||
# If the project has a trunk or branches, we will extract heads | ||||
# from them. We keep the project root otherwise. | ||||
if trunk: | ||||
Augie Fackler
|
r43347 | oldmodule = self.module or b'' | ||
self.module += b'/' + trunk | ||||
Patrick Mezard
|
r5955 | self.head = self.latest(self.module, self.last_changed) | ||
Patrick Mezard
|
r5957 | if not self.head: | ||
Augie Fackler
|
r43346 | raise error.Abort( | ||
Augie Fackler
|
r43347 | _(b'no revision found in module %s') % self.module | ||
Augie Fackler
|
r43346 | ) | ||
Edouard Gomez
|
r5854 | |||
# First head in the list is the module's head | ||||
self.heads = [self.head] | ||||
Patrick Mezard
|
r6400 | if self.tags is not None: | ||
Augie Fackler
|
r43347 | self.tags = b'%s/%s' % (oldmodule, (self.tags or b'tags')) | ||
Edouard Gomez
|
r5854 | |||
# Check if branches bring a few more heads to the list | ||||
if branches: | ||||
Augie Fackler
|
r43347 | rpath = self.url.strip(b'/') | ||
Augie Fackler
|
r43346 | branchnames = svn.client.ls( | ||
Augie Fackler
|
r43347 | rpath + b'/' + quote(branches), rev, False, self.ctx | ||
Augie Fackler
|
r43346 | ) | ||
Mads Kiilerich
|
r18374 | for branch in sorted(branchnames): | ||
Augie Fackler
|
r43347 | module = b'%s/%s/%s' % (oldmodule, branches, branch) | ||
Patrick Mezard
|
r6491 | if not isdir(module, self.last_changed): | ||
continue | ||||
Patrick Mezard
|
r5955 | brevid = self.latest(module, self.last_changed) | ||
Patrick Mezard
|
r5957 | if not brevid: | ||
Augie Fackler
|
r43347 | self.ui.note(_(b'ignoring empty branch %s\n') % branch) | ||
Patrick Mezard
|
r5957 | continue | ||
Augie Fackler
|
r43346 | self.ui.note( | ||
Augie Fackler
|
r43347 | _(b'found branch %s at %d\n') | ||
% (branch, self.revnum(brevid)) | ||||
Augie Fackler
|
r43346 | ) | ||
Patrick Mezard
|
r5955 | self.heads.append(brevid) | ||
Kirill Smelkov
|
r5462 | |||
Patrick Mezard
|
r6173 | if self.startrev and self.heads: | ||
if len(self.heads) > 1: | ||||
Augie Fackler
|
r43346 | raise error.Abort( | ||
_( | ||||
Augie Fackler
|
r43347 | b'svn: start revision is not supported ' | ||
b'with more than one branch' | ||||
Augie Fackler
|
r43346 | ) | ||
) | ||||
Patrick Mezard
|
r6173 | revnum = self.revnum(self.heads[0]) | ||
if revnum < self.startrev: | ||||
Pierre-Yves David
|
r26587 | raise error.Abort( | ||
Augie Fackler
|
r43347 | _(b'svn: no revision found after start revision %d') | ||
Augie Fackler
|
r43346 | % self.startrev | ||
) | ||||
Patrick Mezard
|
r6173 | |||
Brendan Cully
|
r4840 | return self.heads | ||
Mads Kiilerich
|
r22300 | def _getchanges(self, rev, full): | ||
Brendan Cully
|
r5121 | (paths, parents) = self.paths[rev] | ||
Mads Kiilerich
|
r22300 | copies = {} | ||
Patrick Mezard
|
r5956 | if parents: | ||
Patrick Mezard
|
r11127 | files, self.removed, copies = self.expandpaths(rev, paths, parents) | ||
Mads Kiilerich
|
r22300 | if full or not parents: | ||
Patrick Mezard
|
r5956 | # Perform a full checkout on roots | ||
Patrick Mezard
|
r13690 | uuid, module, revnum = revsplit(rev) | ||
Augie Fackler
|
r43346 | entries = svn.client.ls( | ||
self.baseurl + quote(module), optrev(revnum), True, self.ctx | ||||
) | ||||
files = [ | ||||
n | ||||
Gregory Szorc
|
r49768 | for n, e in entries.items() | ||
Augie Fackler
|
r43346 | if e.kind == svn.core.svn_node_file | ||
] | ||||
Patrick Mezard
|
r11127 | self.removed = set() | ||
Patrick Mezard
|
r5956 | |||
Brendan Cully
|
r5121 | files.sort() | ||
Manuel Jacob
|
r45493 | files = pycompat.ziplist(files, [rev] * len(files)) | ||
Mads Kiilerich
|
r22298 | return (files, copies) | ||
Brendan Cully
|
r5121 | |||
Mads Kiilerich
|
r22300 | def getchanges(self, rev, full): | ||
Mads Kiilerich
|
r22298 | # reuse cache from getchangedfiles | ||
Mads Kiilerich
|
r22300 | if self._changescache[0] == rev and not full: | ||
Mads Kiilerich
|
r22298 | (files, copies) = self._changescache[1] | ||
else: | ||||
Mads Kiilerich
|
r22300 | (files, copies) = self._getchanges(rev, full) | ||
Mads Kiilerich
|
r22298 | # caller caches the result, so free it here to release memory | ||
del self.paths[rev] | ||||
Mads Kiilerich
|
r24395 | return (files, copies, set()) | ||
Brendan Cully
|
r4840 | |||
Alexis S. L. Carvalho
|
r5382 | def getchangedfiles(self, rev, i): | ||
Mads Kiilerich
|
r22298 | # called from filemap - cache computed values for reuse in getchanges | ||
Mads Kiilerich
|
r22300 | (files, copies) = self._getchanges(rev, False) | ||
Mads Kiilerich
|
r22298 | self._changescache = (rev, (files, copies)) | ||
return [f[0] for f in files] | ||||
Alexis S. L. Carvalho
|
r5382 | |||
Brendan Cully
|
r4840 | def getcommit(self, rev): | ||
if rev not in self.commits: | ||||
Patrick Mezard
|
r13690 | uuid, module, revnum = revsplit(rev) | ||
Brendan Cully
|
r4840 | self.module = module | ||
self.reparent(module) | ||||
Patrick Mezard
|
r5875 | # We assume that: | ||
# - requests for revisions after "stop" come from the | ||||
# revision graph backward traversal. Cache all of them | ||||
# down to stop, they will be used eventually. | ||||
# - requests for revisions before "stop" come to get | ||||
# isolated branches parents. Just fetch what is needed. | ||||
Brendan Cully
|
r4840 | stop = self.lastrevs.get(module, 0) | ||
Patrick Mezard
|
r5875 | if revnum < stop: | ||
stop = revnum + 1 | ||||
Patrick Mezard
|
r5871 | self._fetch_revisions(revnum, stop) | ||
Jesus Espino Garcia
|
r15970 | if rev not in self.commits: | ||
Augie Fackler
|
r43347 | raise error.Abort(_(b'svn: revision %s not found') % revnum) | ||
Mads Kiilerich
|
r22201 | revcommit = self.commits[rev] | ||
Brendan Cully
|
r4840 | # caller caches the result, so free it here to release memory | ||
del self.commits[rev] | ||||
Mads Kiilerich
|
r22201 | return revcommit | ||
Brendan Cully
|
r4840 | |||
Augie Fackler
|
r43347 | def checkrevformat(self, revstr, mapname=b'splicemap'): | ||
Kyle Lippincott
|
r47856 | """fails if revision format does not match the correct format""" | ||
Augie Fackler
|
r43346 | if not re.match( | ||
Manuel Jacob
|
r45498 | br'svn:[0-9a-f]{8,8}-[0-9a-f]{4,4}-' | ||
br'[0-9a-f]{4,4}-[0-9a-f]{4,4}-[0-9a-f]' | ||||
br'{12,12}(.*)@[0-9]+$', | ||||
Augie Fackler
|
r43346 | revstr, | ||
): | ||||
raise error.Abort( | ||||
Martin von Zweigbergk
|
r43387 | _(b'%s entry %s is not a valid revision identifier') | ||
Augie Fackler
|
r43346 | % (mapname, revstr) | ||
) | ||||
Ben Goswami
|
r19122 | |||
Augie Fackler
|
r22414 | def numcommits(self): | ||
Augie Fackler
|
r43347 | return int(self.head.rsplit(b'@', 1)[1]) - self.startrev | ||
Augie Fackler
|
r22414 | |||
Brendan Cully
|
r4840 | def gettags(self): | ||
tags = {} | ||||
Patrick Mezard
|
r6172 | if self.tags is None: | ||
return tags | ||||
Thomas Arendsen Hein
|
r6210 | |||
Patrick Mezard
|
r6399 | # svn tags are just a convention, project branches left in a | ||
# 'tags' directory. There is no other relationship than | ||||
# ancestry, which is expensive to discover and makes them hard | ||||
# to update incrementally. Worse, past revisions may be | ||||
# referenced by tags far away in the future, requiring a deep | ||||
# history traversal on every calculation. Current code | ||||
# performs a single backward traversal, tracking moves within | ||||
# the tags directory (tag renaming) and recording a new tag | ||||
# everytime a project is copied from outside the tags | ||||
# directory. It also lists deleted tags, this behaviour may | ||||
# change in the future. | ||||
pendings = [] | ||||
tagspath = self.tags | ||||
start = svn.ra.get_latest_revnum(self.ra) | ||||
Aaron Digulla
|
r11195 | stream = self._getlog([self.tags], start, self.startrev) | ||
try: | ||||
for entry in stream: | ||||
origpaths, revnum, author, date, message = entry | ||||
Matt Mackall
|
r19468 | if not origpaths: | ||
origpaths = [] | ||||
Augie Fackler
|
r43346 | copies = [ | ||
(e.copyfrom_path, e.copyfrom_rev, p) | ||||
Gregory Szorc
|
r49768 | for p, e in origpaths.items() | ||
Augie Fackler
|
r43346 | if e.copyfrom_path | ||
] | ||||
Aaron Digulla
|
r11195 | # Apply moves/copies from more specific to general | ||
copies.sort(reverse=True) | ||||
Patrick Mezard
|
r6399 | |||
Aaron Digulla
|
r11195 | srctagspath = tagspath | ||
if copies and copies[-1][2] == tagspath: | ||||
# Track tags directory moves | ||||
srctagspath = copies.pop()[0] | ||||
Patrick Mezard
|
r6399 | |||
Aaron Digulla
|
r11195 | for source, sourcerev, dest in copies: | ||
Augie Fackler
|
r43347 | if not dest.startswith(tagspath + b'/'): | ||
Aaron Digulla
|
r11195 | continue | ||
for tag in pendings: | ||||
if tag[0].startswith(dest): | ||||
Augie Fackler
|
r43346 | tagpath = source + tag[0][len(dest) :] | ||
Aaron Digulla
|
r11195 | tag[:2] = [tagpath, sourcerev] | ||
break | ||||
else: | ||||
pendings.append([source, sourcerev, dest]) | ||||
Patrick Mezard
|
r8248 | |||
Aaron Digulla
|
r11195 | # Filter out tags with children coming from different | ||
# parts of the repository like: | ||||
# /tags/tag.1 (from /trunk:10) | ||||
# /tags/tag.1/foo (from /branches/foo:12) | ||||
# Here/tags/tag.1 discarded as well as its children. | ||||
# It happens with tools like cvs2svn. Such tags cannot | ||||
# be represented in mercurial. | ||||
Augie Fackler
|
r44937 | addeds = { | ||
p: e.copyfrom_path | ||||
Gregory Szorc
|
r49768 | for p, e in origpaths.items() | ||
Augie Fackler
|
r43347 | if e.action == b'A' and e.copyfrom_path | ||
Augie Fackler
|
r44937 | } | ||
Aaron Digulla
|
r11195 | badroots = set() | ||
for destroot in addeds: | ||||
for source, sourcerev, dest in pendings: | ||||
Augie Fackler
|
r43346 | if not dest.startswith( | ||
Augie Fackler
|
r43347 | destroot + b'/' | ||
) or source.startswith(addeds[destroot] + b'/'): | ||||
Aaron Digulla
|
r11195 | continue | ||
badroots.add(destroot) | ||||
break | ||||
Patrick Mezard
|
r8248 | |||
Aaron Digulla
|
r11195 | for badroot in badroots: | ||
Augie Fackler
|
r43346 | pendings = [ | ||
p | ||||
for p in pendings | ||||
if p[2] != badroot | ||||
Augie Fackler
|
r43347 | and not p[2].startswith(badroot + b'/') | ||
Augie Fackler
|
r43346 | ] | ||
Patrick Mezard
|
r6399 | |||
Aaron Digulla
|
r11195 | # Tell tag renamings from tag creations | ||
Martin Geisler
|
r15124 | renamings = [] | ||
Aaron Digulla
|
r11195 | for source, sourcerev, dest in pendings: | ||
Augie Fackler
|
r43347 | tagname = dest.split(b'/')[-1] | ||
Aaron Digulla
|
r11195 | if source.startswith(srctagspath): | ||
Martin Geisler
|
r15124 | renamings.append([source, sourcerev, tagname]) | ||
Aaron Digulla
|
r11195 | continue | ||
if tagname in tags: | ||||
# Keep the latest tag value | ||||
continue | ||||
# From revision may be fake, get one with changes | ||||
try: | ||||
tagid = self.latest(source, sourcerev) | ||||
if tagid and tagname not in tags: | ||||
tags[tagname] = tagid | ||||
except SvnPathNotFound: | ||||
# It happens when we are following directories | ||||
# we assumed were copied with their parents | ||||
# but were really created in the tag | ||||
# directory. | ||||
pass | ||||
Martin Geisler
|
r15124 | pendings = renamings | ||
Aaron Digulla
|
r11195 | tagspath = srctagspath | ||
finally: | ||||
stream.close() | ||||
Bryan O'Sullivan
|
r4946 | return tags | ||
Brendan Cully
|
r4840 | |||
Bryan O'Sullivan
|
r5554 | def converted(self, rev, destrev): | ||
if not self.wc: | ||||
return | ||||
if self.convertfp is None: | ||||
Augie Fackler
|
r43346 | self.convertfp = open( | ||
Augie Fackler
|
r43347 | os.path.join(self.wc, b'.svn', b'hg-shamap'), b'ab' | ||
Augie Fackler
|
r43346 | ) | ||
self.convertfp.write( | ||||
Augie Fackler
|
r43347 | util.tonativeeol(b'%s %d\n' % (destrev, self.revnum(rev))) | ||
Augie Fackler
|
r43346 | ) | ||
Bryan O'Sullivan
|
r5554 | self.convertfp.flush() | ||
Brendan Cully
|
r4810 | def revid(self, revnum, module=None): | ||
Manuel Jacob
|
r45492 | return b'svn:%s%s@%d' % (self.uuid, module or self.module, revnum) | ||
Brendan Cully
|
r4774 | |||
def revnum(self, rev): | ||||
Augie Fackler
|
r43347 | return int(rev.split(b'@')[-1]) | ||
Brendan Cully
|
r4789 | |||
Patrick Mezard
|
r16464 | def latest(self, path, stop=None): | ||
"""Find the latest revid affecting path, up to stop revision | ||||
number. If stop is None, default to repository latest | ||||
revision. It may return a revision in a different module, | ||||
since a branch may be moved without a change being | ||||
reported. Return None if computed module does not belong to | ||||
rootmodule subtree. | ||||
Patrick Mezard
|
r5955 | """ | ||
Augie Fackler
|
r43346 | |||
Patrick Mezard
|
r16466 | def findchanges(path, start, stop=None): | ||
stream = self._getlog([path], start, stop or 1) | ||||
Patrick Mezard
|
r16465 | try: | ||
for entry in stream: | ||||
paths, revnum, author, date, message = entry | ||||
Patrick Mezard
|
r16466 | if stop is None and paths: | ||
# We do not know the latest changed revision, | ||||
# keep the first one with changed paths. | ||||
break | ||||
Manuel Jacob
|
r45499 | if stop is not None and revnum <= stop: | ||
Patrick Mezard
|
r16465 | break | ||
for p in paths: | ||||
Augie Fackler
|
r43346 | if not path.startswith(p) or not paths[p].copyfrom_path: | ||
Patrick Mezard
|
r16465 | continue | ||
Augie Fackler
|
r43346 | newpath = paths[p].copyfrom_path + path[len(p) :] | ||
self.ui.debug( | ||||
Augie Fackler
|
r43347 | b"branch renamed from %s to %s at %d\n" | ||
Augie Fackler
|
r43346 | % (path, newpath, revnum) | ||
) | ||||
Patrick Mezard
|
r16465 | path = newpath | ||
break | ||||
Patrick Mezard
|
r16466 | if not paths: | ||
revnum = None | ||||
Patrick Mezard
|
r16465 | return revnum, path | ||
finally: | ||||
stream.close() | ||||
Patrick Mezard
|
r6281 | if not path.startswith(self.rootmodule): | ||
# Requests on foreign branches may be forbidden at server level | ||||
Augie Fackler
|
r43347 | self.ui.debug(b'ignoring foreign branch %r\n' % path) | ||
Patrick Mezard
|
r6281 | return None | ||
Patrick Mezard
|
r16464 | if stop is None: | ||
Brendan Cully
|
r4789 | stop = svn.ra.get_latest_revnum(self.ra) | ||
try: | ||||
Augie Fackler
|
r43347 | prevmodule = self.reparent(b'') | ||
dirent = svn.ra.stat(self.ra, path.strip(b'/'), stop) | ||||
Patrick Mezard
|
r6847 | self.reparent(prevmodule) | ||
FUJIWARA Katsunori
|
r28460 | except svn.core.SubversionException: | ||
Brendan Cully
|
r4789 | dirent = None | ||
if not dirent: | ||||
Augie Fackler
|
r43346 | raise SvnPathNotFound( | ||
Augie Fackler
|
r43347 | _(b'%s not found up to revision %d') % (path, stop) | ||
Augie Fackler
|
r43346 | ) | ||
Brendan Cully
|
r4789 | |||
Martin Geisler
|
r8660 | # stat() gives us the previous revision on this line of | ||
# development, but it might be in *another module*. Fetch the | ||||
# log and detect renames down to the latest revision. | ||||
Patrick Mezard
|
r16465 | revnum, realpath = findchanges(path, stop, dirent.created_rev) | ||
Patrick Mezard
|
r16466 | if revnum is None: | ||
# Tools like svnsync can create empty revision, when | ||||
# synchronizing only a subtree for instance. These empty | ||||
# revisions created_rev still have their original values | ||||
# despite all changes having disappeared and can be | ||||
# returned by ra.stat(), at least when stating the root | ||||
# module. In that case, do not trust created_rev and scan | ||||
# the whole history. | ||||
revnum, realpath = findchanges(path, stop) | ||||
if revnum is None: | ||||
Augie Fackler
|
r43347 | self.ui.debug(b'ignoring empty branch %r\n' % realpath) | ||
Patrick Mezard
|
r16466 | return None | ||
Patrick Mezard
|
r16465 | if not realpath.startswith(self.rootmodule): | ||
Augie Fackler
|
r43347 | self.ui.debug(b'ignoring foreign branch %r\n' % realpath) | ||
Patrick Mezard
|
r5957 | return None | ||
Patrick Mezard
|
r16465 | return self.revid(revnum, realpath) | ||
Brendan Cully
|
r4789 | |||
Daniel Holth
|
r4765 | def reparent(self, module): | ||
Patrick Mezard
|
r6847 | """Reparent the svn transport and return the previous parent.""" | ||
if self.prevmodule == module: | ||||
return module | ||||
Patrick Mezard
|
r15599 | svnurl = self.baseurl + quote(module) | ||
Patrick Mezard
|
r6847 | prevmodule = self.prevmodule | ||
if prevmodule is None: | ||||
Augie Fackler
|
r43347 | prevmodule = b'' | ||
self.ui.debug(b"reparent to %s\n" % svnurl) | ||||
Patrick Mezard
|
r7074 | svn.ra.reparent(self.ra, svnurl) | ||
Patrick Mezard
|
r6847 | self.prevmodule = module | ||
return prevmodule | ||||
Daniel Holth
|
r4765 | |||
Brendan Cully
|
r5120 | def expandpaths(self, rev, paths, parents): | ||
Patrick Mezard
|
r11127 | changed, removed = set(), set() | ||
Brendan Cully
|
r5120 | copies = {} | ||
Patrick Mezard
|
r13690 | new_module, revnum = revsplit(rev)[1:] | ||
Patrick Mezard
|
r5872 | if new_module != self.module: | ||
self.module = new_module | ||||
self.reparent(self.module) | ||||
Brendan Cully
|
r5121 | |||
Augie Fackler
|
r43346 | progress = self.ui.makeprogress( | ||
Augie Fackler
|
r43347 | _(b'scanning paths'), unit=_(b'paths'), total=len(paths) | ||
Augie Fackler
|
r43346 | ) | ||
Patrick Mezard
|
r11137 | for i, (path, ent) in enumerate(paths): | ||
Martin von Zweigbergk
|
r38425 | progress.update(i, item=path) | ||
Patrick Mezard
|
r6539 | entrypath = self.getrelpath(path) | ||
Brendan Cully
|
r5120 | |||
Patrick Mezard
|
r6848 | kind = self._checkpath(entrypath, revnum) | ||
Brendan Cully
|
r5120 | if kind == svn.core.svn_node_file: | ||
Patrick Mezard
|
r11127 | changed.add(self.recode(entrypath)) | ||
Patrick Mezard
|
r6546 | if not ent.copyfrom_path or not parents: | ||
Patrick Mezard
|
r6544 | continue | ||
Martin Geisler
|
r8660 | # Copy sources not in parent revisions cannot be | ||
# represented, ignore their origin for now | ||||
Patrick Mezard
|
r13690 | pmodule, prevnum = revsplit(parents[0])[1:] | ||
Patrick Mezard
|
r6546 | if ent.copyfrom_rev < prevnum: | ||
continue | ||||
copyfrom_path = self.getrelpath(ent.copyfrom_path, pmodule) | ||||
Patrick Mezard
|
r6544 | if not copyfrom_path: | ||
continue | ||||
Augie Fackler
|
r43346 | self.ui.debug( | ||
Manuel Jacob
|
r45496 | b"copied to %s from %s@%d\n" | ||
Augie Fackler
|
r43346 | % (entrypath, copyfrom_path, ent.copyfrom_rev) | ||
) | ||||
Patrick Mezard
|
r8885 | copies[self.recode(entrypath)] = self.recode(copyfrom_path) | ||
Augie Fackler
|
r43346 | elif kind == 0: # gone, but had better be a deleted *file* | ||
Manuel Jacob
|
r45496 | self.ui.debug(b"gone from %d\n" % ent.copyfrom_rev) | ||
Patrick Mezard
|
r13690 | pmodule, prevnum = revsplit(parents[0])[1:] | ||
Augie Fackler
|
r43347 | parentpath = pmodule + b"/" + entrypath | ||
Patrick Mezard
|
r11128 | fromkind = self._checkpath(entrypath, prevnum, pmodule) | ||
Thomas Arendsen Hein
|
r6210 | |||
Patrick Mezard
|
r8881 | if fromkind == svn.core.svn_node_file: | ||
Patrick Mezard
|
r11127 | removed.add(self.recode(entrypath)) | ||
Brendan Cully
|
r5120 | elif fromkind == svn.core.svn_node_dir: | ||
Augie Fackler
|
r43347 | oroot = parentpath.strip(b'/') | ||
nroot = path.strip(b'/') | ||||
Patrick Mezard
|
r11133 | children = self._iterfiles(oroot, prevnum) | ||
Patrick Mezard
|
r11132 | for childpath in children: | ||
childpath = childpath.replace(oroot, nroot) | ||||
Augie Fackler
|
r43347 | childpath = self.getrelpath(b"/" + childpath, pmodule) | ||
Patrick Mezard
|
r11125 | if childpath: | ||
Patrick Mezard
|
r11127 | removed.add(self.recode(childpath)) | ||
Brendan Cully
|
r5120 | else: | ||
Augie Fackler
|
r43346 | self.ui.debug( | ||
Augie Fackler
|
r43347 | b'unknown path in revision %d: %s\n' % (revnum, path) | ||
Augie Fackler
|
r43346 | ) | ||
Martin Geisler
|
r12770 | elif kind == svn.core.svn_node_dir: | ||
Augie Fackler
|
r43347 | if ent.action == b'M': | ||
Patrick Mezard
|
r11128 | # If the directory just had a prop change, | ||
# then we shouldn't need to look for its children. | ||||
Patrick Mezard
|
r5870 | continue | ||
Augie Fackler
|
r43347 | if ent.action == b'R' and parents: | ||
Patrick Mezard
|
r11128 | # If a directory is replacing a file, mark the previous | ||
# file as deleted | ||||
Patrick Mezard
|
r13690 | pmodule, prevnum = revsplit(parents[0])[1:] | ||
Patrick Mezard
|
r11128 | pkind = self._checkpath(entrypath, prevnum, pmodule) | ||
if pkind == svn.core.svn_node_file: | ||||
removed.add(self.recode(entrypath)) | ||||
Patrick Mezard
|
r13052 | elif pkind == svn.core.svn_node_dir: | ||
# We do not know what files were kept or removed, | ||||
# mark them all as changed. | ||||
for childpath in self._iterfiles(pmodule, prevnum): | ||||
Augie Fackler
|
r43347 | childpath = self.getrelpath(b"/" + childpath) | ||
Patrick Mezard
|
r13052 | if childpath: | ||
changed.add(self.recode(childpath)) | ||||
Patrick Mezard
|
r5870 | |||
Patrick Mezard
|
r11133 | for childpath in self._iterfiles(path, revnum): | ||
Augie Fackler
|
r43347 | childpath = self.getrelpath(b"/" + childpath) | ||
Patrick Mezard
|
r11132 | if childpath: | ||
changed.add(self.recode(childpath)) | ||||
Brendan Cully
|
r5120 | |||
Patrick Mezard
|
r8881 | # Handle directory copies | ||
Patrick Mezard
|
r6543 | if not ent.copyfrom_path or not parents: | ||
Patrick Mezard
|
r6542 | continue | ||
Martin Geisler
|
r8660 | # Copy sources not in parent revisions cannot be | ||
# represented, ignore their origin for now | ||||
Patrick Mezard
|
r13690 | pmodule, prevnum = revsplit(parents[0])[1:] | ||
Patrick Mezard
|
r6543 | if ent.copyfrom_rev < prevnum: | ||
continue | ||||
Patrick Mezard
|
r8882 | copyfrompath = self.getrelpath(ent.copyfrom_path, pmodule) | ||
Patrick Mezard
|
r6542 | if not copyfrompath: | ||
continue | ||||
Augie Fackler
|
r43346 | self.ui.debug( | ||
Augie Fackler
|
r43347 | b"mark %s came from %s:%d\n" | ||
Augie Fackler
|
r43346 | % (path, copyfrompath, ent.copyfrom_rev) | ||
) | ||||
Patrick Mezard
|
r11133 | children = self._iterfiles(ent.copyfrom_path, ent.copyfrom_rev) | ||
Patrick Mezard
|
r11132 | for childpath in children: | ||
Augie Fackler
|
r43347 | childpath = self.getrelpath(b"/" + childpath, pmodule) | ||
Patrick Mezard
|
r11132 | if not childpath: | ||
Patrick Mezard
|
r6542 | continue | ||
Augie Fackler
|
r43346 | copytopath = path + childpath[len(copyfrompath) :] | ||
Patrick Mezard
|
r6542 | copytopath = self.getrelpath(copytopath) | ||
Patrick Mezard
|
r11132 | copies[self.recode(copytopath)] = self.recode(childpath) | ||
Brendan Cully
|
r5120 | |||
Martin von Zweigbergk
|
r38425 | progress.complete() | ||
Patrick Mezard
|
r11127 | changed.update(removed) | ||
return (list(changed), removed, copies) | ||||
Brendan Cully
|
r5120 | |||
Patrick Mezard
|
r5871 | def _fetch_revisions(self, from_revnum, to_revnum): | ||
if from_revnum < to_revnum: | ||||
from_revnum, to_revnum = to_revnum, from_revnum | ||||
Bryan O'Sullivan
|
r4940 | self.child_cset = None | ||
Patrick Mezard
|
r6545 | |||
Bryan O'Sullivan
|
r4946 | def parselogentry(orig_paths, revnum, author, date, message): | ||
Thomas Arendsen Hein
|
r6210 | """Return the parsed commit object or None, and True if | ||
Patrick Mezard
|
r5872 | the revision is a branch root. | ||
""" | ||||
Augie Fackler
|
r43346 | self.ui.debug( | ||
Augie Fackler
|
r43347 | b"parsing revision %d (%d changes)\n" | ||
% (revnum, len(orig_paths)) | ||||
Augie Fackler
|
r43346 | ) | ||
Bryan O'Sullivan
|
r4940 | |||
Patrick Mezard
|
r5957 | branched = False | ||
Brendan Cully
|
r4810 | rev = self.revid(revnum) | ||
Brendan Cully
|
r4837 | # branch log might return entries for a parent we already have | ||
Patrick Mezard
|
r5871 | |||
Martin Geisler
|
r8117 | if rev in self.commits or revnum < to_revnum: | ||
Patrick Mezard
|
r5957 | return None, branched | ||
Brendan Cully
|
r4837 | |||
Brendan Cully
|
r5120 | parents = [] | ||
Patrick Mezard
|
r5958 | # check whether this revision is the start of a branch or part | ||
# of a branch renaming | ||||
Gregory Szorc
|
r49768 | orig_paths = sorted(orig_paths.items()) | ||
Augie Fackler
|
r43346 | root_paths = [ | ||
(p, e) for p, e in orig_paths if self.module.startswith(p) | ||||
] | ||||
Patrick Mezard
|
r5958 | if root_paths: | ||
path, ent = root_paths[-1] | ||||
Brendan Cully
|
r5119 | if ent.copyfrom_path: | ||
Patrick Mezard
|
r5957 | branched = True | ||
Augie Fackler
|
r43346 | newpath = ent.copyfrom_path + self.module[len(path) :] | ||
Brendan Cully
|
r5119 | # ent.copyfrom_rev may not be the actual last revision | ||
Patrick Mezard
|
r7476 | previd = self.latest(newpath, ent.copyfrom_rev) | ||
Patrick Mezard
|
r5957 | if previd is not None: | ||
Patrick Mezard
|
r13690 | prevmodule, prevnum = revsplit(previd)[1:] | ||
Patrick Mezard
|
r6173 | if prevnum >= self.startrev: | ||
parents = [previd] | ||||
Matt Mackall
|
r10282 | self.ui.note( | ||
Augie Fackler
|
r43347 | _(b'found parent of branch %s at %d: %s\n') | ||
Augie Fackler
|
r43346 | % (self.module, prevnum, prevmodule) | ||
) | ||||
Brendan Cully
|
r5119 | else: | ||
Augie Fackler
|
r43347 | self.ui.debug(b"no copyfrom path, don't know what to do.\n") | ||
Brendan Cully
|
r5119 | |||
Brendan Cully
|
r5120 | paths = [] | ||
# filter out unrelated paths | ||||
Bryan O'Sullivan
|
r4940 | for path, ent in orig_paths: | ||
Patrick Mezard
|
r6540 | if self.getrelpath(path) is None: | ||
Brendan Cully
|
r4788 | continue | ||
Brendan Cully
|
r5120 | paths.append((path, ent)) | ||
Daniel Holth
|
r4765 | |||
Nikita Slyusarev
|
r47129 | date = parsesvndate(date) | ||
Augie Fackler
|
r43347 | if self.ui.configbool(b'convert', b'localtimezone'): | ||
Julian Cowley
|
r17974 | date = makedatetimestamp(date[0]) | ||
Daniel Holth
|
r4765 | |||
Jordi Gutiérrez Hermoso
|
r24306 | if message: | ||
log = self.recode(message) | ||||
else: | ||||
Augie Fackler
|
r43347 | log = b'' | ||
Jordi Gutiérrez Hermoso
|
r24306 | |||
if author: | ||||
author = self.recode(author) | ||||
else: | ||||
Augie Fackler
|
r43347 | author = b'' | ||
Jordi Gutiérrez Hermoso
|
r24306 | |||
Brendan Cully
|
r5120 | try: | ||
Augie Fackler
|
r43347 | branch = self.module.split(b"/")[-1] | ||
Patrick Mezard
|
r13529 | if branch == self.trunkname: | ||
branch = None | ||||
Brendan Cully
|
r5120 | except IndexError: | ||
branch = None | ||||
Daniel Holth
|
r4765 | |||
Augie Fackler
|
r43346 | cset = commit( | ||
author=author, | ||||
Augie Fackler
|
r43347 | date=dateutil.datestr(date, b'%Y-%m-%d %H:%M:%S %1%2'), | ||
Augie Fackler
|
r43346 | desc=log, | ||
parents=parents, | ||||
branch=branch, | ||||
rev=rev, | ||||
) | ||||
Brendan Cully
|
r4788 | |||
Brendan Cully
|
r4796 | self.commits[rev] = cset | ||
Patrick Mezard
|
r5872 | # The parents list is *shared* among self.paths and the | ||
# commit object. Both will be updated below. | ||||
self.paths[rev] = (paths, cset.parents) | ||||
Brendan Cully
|
r4796 | if self.child_cset and not self.child_cset.parents: | ||
Patrick Mezard
|
r5872 | self.child_cset.parents[:] = [rev] | ||
Brendan Cully
|
r4788 | self.child_cset = cset | ||
Patrick Mezard
|
r5957 | return cset, branched | ||
Brendan Cully
|
r4796 | |||
Augie Fackler
|
r43346 | self.ui.note( | ||
Augie Fackler
|
r43347 | _(b'fetching revision log for "%s" from %d to %d\n') | ||
Augie Fackler
|
r43346 | % (self.module, from_revnum, to_revnum) | ||
) | ||||
Daniel Holth
|
r4765 | |||
try: | ||||
Patrick Mezard
|
r5871 | firstcset = None | ||
Patrick Mezard
|
r6173 | lastonbranch = False | ||
Patrick Mezard
|
r6850 | stream = self._getlog([self.module], from_revnum, to_revnum) | ||
Patrick Mezard
|
r5873 | try: | ||
for entry in stream: | ||||
paths, revnum, author, date, message = entry | ||||
Patrick Mezard
|
r6173 | if revnum < self.startrev: | ||
lastonbranch = True | ||||
break | ||||
Francis Barber
|
r8172 | if not paths: | ||
Augie Fackler
|
r43347 | self.ui.debug(b'revision %d has no entries\n' % revnum) | ||
Patrick Mezard
|
r10618 | # If we ever leave the loop on an empty | ||
# revision, do not try to get a parent branch | ||||
lastonbranch = lastonbranch or revnum == 0 | ||||
Patrick Mezard
|
r5873 | continue | ||
Augie Fackler
|
r43346 | cset, lastonbranch = parselogentry( | ||
paths, revnum, author, date, message | ||||
) | ||||
Patrick Mezard
|
r5873 | if cset: | ||
firstcset = cset | ||||
Patrick Mezard
|
r6173 | if lastonbranch: | ||
Patrick Mezard
|
r5873 | break | ||
finally: | ||||
stream.close() | ||||
Patrick Mezard
|
r5871 | |||
Patrick Mezard
|
r6173 | if not lastonbranch and firstcset and not firstcset.parents: | ||
Patrick Mezard
|
r5871 | # The first revision of the sequence (the last fetched one) | ||
# has invalid parents if not a branch root. Find the parent | ||||
# revision now, if any. | ||||
try: | ||||
firstrevnum = self.revnum(firstcset.rev) | ||||
if firstrevnum > 1: | ||||
latest = self.latest(self.module, firstrevnum - 1) | ||||
Patrick Mezard
|
r5957 | if latest: | ||
firstcset.parents.append(latest) | ||||
Patrick Mezard
|
r7381 | except SvnPathNotFound: | ||
Patrick Mezard
|
r5871 | pass | ||
FUJIWARA Katsunori
|
r28460 | except svn.core.SubversionException as xxx_todo_changeme: | ||
Gregory Szorc
|
r25660 | (inst, num) = xxx_todo_changeme.args | ||
Daniel Holth
|
r4765 | if num == svn.core.SVN_ERR_FS_NO_SUCH_REVISION: | ||
Augie Fackler
|
r43346 | raise error.Abort( | ||
Augie Fackler
|
r43347 | _(b'svn: branch has no revision %s') % to_revnum | ||
Augie Fackler
|
r43346 | ) | ||
Daniel Holth
|
r4765 | raise | ||
Patrick Mezard
|
r11134 | def getfile(self, file, rev): | ||
Daniel Holth
|
r4765 | # TODO: ra.get_file transmits the whole file instead of diffs. | ||
Patrick Mezard
|
r11127 | if file in self.removed: | ||
Mads Kiilerich
|
r22296 | return None, None | ||
Daniel Holth
|
r4765 | try: | ||
Patrick Mezard
|
r13690 | new_module, revnum = revsplit(rev)[1:] | ||
Patrick Mezard
|
r5872 | if self.module != new_module: | ||
self.module = new_module | ||||
Daniel Holth
|
r4765 | self.reparent(self.module) | ||
timeless
|
r28861 | io = stringio() | ||
Daniel Holth
|
r4765 | info = svn.ra.get_file(self.ra, file, revnum, io) | ||
Patrick Mezard
|
r7446 | data = io.getvalue() | ||
Mads Kiilerich
|
r17424 | # ra.get_file() seems to keep a reference on the input buffer | ||
timeless@mozdev.org
|
r17479 | # preventing collection. Release it explicitly. | ||
Patrick Mezard
|
r7446 | io.close() | ||
Daniel Holth
|
r4765 | if isinstance(info, list): | ||
info = info[-1] | ||||
Augie Fackler
|
r43347 | mode = (b"svn:executable" in info) and b'x' or b'' | ||
mode = (b"svn:special" in info) and b'l' or mode | ||||
FUJIWARA Katsunori
|
r28460 | except svn.core.SubversionException as e: | ||
Augie Fackler
|
r43346 | notfound = ( | ||
svn.core.SVN_ERR_FS_NOT_FOUND, | ||||
svn.core.SVN_ERR_RA_DAV_PATH_NOT_FOUND, | ||||
) | ||||
if e.apr_err in notfound: # File not found | ||||
Mads Kiilerich
|
r22296 | return None, None | ||
Daniel Holth
|
r4765 | raise | ||
Augie Fackler
|
r43347 | if mode == b'l': | ||
link_prefix = b"link " | ||||
Daniel Holth
|
r4765 | if data.startswith(link_prefix): | ||
Augie Fackler
|
r43346 | data = data[len(link_prefix) :] | ||
Daniel Holth
|
r4765 | return data, mode | ||
Patrick Mezard
|
r11133 | def _iterfiles(self, path, revnum): | ||
"""Enumerate all files in path at revnum, recursively.""" | ||||
Augie Fackler
|
r43347 | path = path.strip(b'/') | ||
FUJIWARA Katsunori
|
r28460 | pool = svn.core.Pool() | ||
Augie Fackler
|
r43347 | rpath = b'/'.join([self.baseurl, quote(path)]).strip(b'/') | ||
Matt Mackall
|
r11167 | entries = svn.client.ls(rpath, optrev(revnum), True, self.ctx, pool) | ||
Patrick Mezard
|
r13651 | if path: | ||
Augie Fackler
|
r43347 | path += b'/' | ||
Augie Fackler
|
r43346 | return ( | ||
(path + p) | ||||
Gregory Szorc
|
r49768 | for p, e in entries.items() | ||
Augie Fackler
|
r43346 | if e.kind == svn.core.svn_node_file | ||
) | ||||
Bryan O'Sullivan
|
r5513 | |||
Patrick Mezard
|
r6539 | def getrelpath(self, path, module=None): | ||
if module is None: | ||||
module = self.module | ||||
# Given the repository url of this wc, say | ||||
# "http://server/plone/CMFPlone/branches/Plone-2_0-branch" | ||||
# extract the "entry" portion (a relative path) from what | ||||
Mads Kiilerich
|
r17424 | # svn log --xml says, i.e. | ||
Patrick Mezard
|
r6539 | # "/CMFPlone/branches/Plone-2_0-branch/tests/PloneTestCase.py" | ||
# that is to say "tests/PloneTestCase.py" | ||||
if path.startswith(module): | ||||
Augie Fackler
|
r43347 | relative = path.rstrip(b'/')[len(module) :] | ||
if relative.startswith(b'/'): | ||||
Patrick Mezard
|
r6539 | return relative[1:] | ||
Augie Fackler
|
r43347 | elif relative == b'': | ||
Patrick Mezard
|
r6539 | return relative | ||
# The path is outside our tracked tree... | ||||
Manuel Jacob
|
r45497 | self.ui.debug( | ||
b'%r is not under %r, ignoring\n' | ||||
% (pycompat.bytestr(path), pycompat.bytestr(module)) | ||||
) | ||||
Patrick Mezard
|
r6539 | return None | ||
Patrick Mezard
|
r11128 | def _checkpath(self, path, revnum, module=None): | ||
if module is not None: | ||||
Augie Fackler
|
r43347 | prevmodule = self.reparent(b'') | ||
path = module + b'/' + path | ||||
Patrick Mezard
|
r11128 | try: | ||
# ra.check_path does not like leading slashes very much, it leads | ||||
# to PROPFIND subversion errors | ||||
Augie Fackler
|
r43347 | return svn.ra.check_path(self.ra, path.strip(b'/'), revnum) | ||
Patrick Mezard
|
r11128 | finally: | ||
if module is not None: | ||||
self.reparent(prevmodule) | ||||
Martin Geisler
|
r12770 | |||
Augie Fackler
|
r43346 | def _getlog( | ||
self, | ||||
paths, | ||||
start, | ||||
end, | ||||
limit=0, | ||||
discover_changed_paths=True, | ||||
strict_node_history=False, | ||||
): | ||||
Patrick Mezard
|
r6850 | # Normalize path names, svn >= 1.5 only wants paths relative to | ||
# supplied URL | ||||
relpaths = [] | ||||
for p in paths: | ||||
Augie Fackler
|
r43347 | if not p.startswith(b'/'): | ||
p = self.module + b'/' + p | ||||
relpaths.append(p.strip(b'/')) | ||||
Augie Fackler
|
r43346 | args = [ | ||
self.baseurl, | ||||
relpaths, | ||||
start, | ||||
end, | ||||
limit, | ||||
discover_changed_paths, | ||||
strict_node_history, | ||||
] | ||||
timeless
|
r27314 | # developer config: convert.svn.debugsvnlog | ||
Augie Fackler
|
r43347 | if not self.ui.configbool(b'convert', b'svn.debugsvnlog'): | ||
Mads Kiilerich
|
r20420 | return directlogstream(*args) | ||
Patrick Mezard
|
r6850 | arg = encodeargs(args) | ||
Yuya Nishihara
|
r37138 | hgexe = procutil.hgexecutable() | ||
Augie Fackler
|
r43347 | cmd = b'%s debugsvnlog' % procutil.shellquote(hgexe) | ||
Manuel Jacob
|
r45403 | stdin, stdout = procutil.popen2(cmd) | ||
Patrick Mezard
|
r6850 | stdin.write(arg) | ||
Patrick Mezard
|
r10071 | try: | ||
stdin.close() | ||||
except IOError: | ||||
Augie Fackler
|
r43346 | raise error.Abort( | ||
_( | ||||
Augie Fackler
|
r43347 | b'Mercurial failed to run itself, check' | ||
b' hg executable is in PATH' | ||||
Augie Fackler
|
r43346 | ) | ||
) | ||||
Patrick Mezard
|
r6850 | return logstream(stdout) | ||
Augie Fackler
|
r43346 | |||
Nikita Slyusarev
|
r47129 | pre_revprop_change_template = b'''#!/bin/sh | ||
Bryan O'Sullivan
|
r5513 | |||
REPOS="$1" | ||||
REV="$2" | ||||
USER="$3" | ||||
PROPNAME="$4" | ||||
ACTION="$5" | ||||
Nikita Slyusarev
|
r47129 | %(rules)s | ||
Bryan O'Sullivan
|
r5513 | |||
echo "Changing prohibited revision property" >&2 | ||||
exit 1 | ||||
''' | ||||
Augie Fackler
|
r43346 | |||
Nikita Slyusarev
|
r47129 | def gen_pre_revprop_change_hook(prop_actions_allowed): | ||
rules = [] | ||||
for action, propname in prop_actions_allowed: | ||||
rules.append( | ||||
( | ||||
b'if [ "$ACTION" = "%s" -a "$PROPNAME" = "%s" ]; ' | ||||
b'then exit 0; fi' | ||||
) | ||||
% (action, propname) | ||||
) | ||||
return pre_revprop_change_template % {b'rules': b'\n'.join(rules)} | ||||
Bryan O'Sullivan
|
r5513 | class svn_sink(converter_sink, commandline): | ||
Pulkit Goyal
|
r38079 | commit_re = re.compile(br'Committed revision (\d+).', re.M) | ||
uuid_re = re.compile(br'Repository UUID:\s*(\S+)', re.M) | ||||
Bryan O'Sullivan
|
r5513 | |||
def prerun(self): | ||||
if self.wc: | ||||
os.chdir(self.wc) | ||||
def postrun(self): | ||||
if self.wc: | ||||
os.chdir(self.cwd) | ||||
def join(self, name): | ||||
Augie Fackler
|
r43347 | return os.path.join(self.wc, b'.svn', name) | ||
Thomas Arendsen Hein
|
r5760 | |||
Bryan O'Sullivan
|
r5513 | def revmapfile(self): | ||
Augie Fackler
|
r43347 | return self.join(b'hg-shamap') | ||
Bryan O'Sullivan
|
r5513 | |||
def authorfile(self): | ||||
Augie Fackler
|
r43347 | return self.join(b'hg-authormap') | ||
Bryan O'Sullivan
|
r5513 | |||
Matt Harbison
|
r35168 | def __init__(self, ui, repotype, path): | ||
Azhagu Selvan SP
|
r13480 | |||
Matt Harbison
|
r35168 | converter_sink.__init__(self, ui, repotype, path) | ||
Augie Fackler
|
r43347 | commandline.__init__(self, ui, b'svn') | ||
Bryan O'Sullivan
|
r5513 | self.delete = [] | ||
Maxim Dounin
|
r5698 | self.setexec = [] | ||
self.delexec = [] | ||||
self.copies = [] | ||||
Bryan O'Sullivan
|
r5513 | self.wc = None | ||
Matt Harbison
|
r39843 | self.cwd = encoding.getcwd() | ||
Bryan O'Sullivan
|
r5513 | |||
created = False | ||||
Augie Fackler
|
r43347 | if os.path.isfile(os.path.join(path, b'.svn', b'entries')): | ||
Patrick Mezard
|
r17247 | self.wc = os.path.realpath(path) | ||
Augie Fackler
|
r43347 | self.run0(b'update') | ||
Bryan O'Sullivan
|
r5513 | else: | ||
Matt Harbison
|
r44474 | if not re.search(br'^(file|http|https|svn|svn\+ssh)://', path): | ||
Patrick Mezard
|
r17247 | path = os.path.realpath(path) | ||
if os.path.isdir(os.path.dirname(path)): | ||||
Augie Fackler
|
r43347 | if not os.path.exists( | ||
os.path.join(path, b'db', b'fs-type') | ||||
): | ||||
Augie Fackler
|
r43346 | ui.status( | ||
Augie Fackler
|
r43347 | _(b"initializing svn repository '%s'\n") | ||
Augie Fackler
|
r43346 | % os.path.basename(path) | ||
) | ||||
Augie Fackler
|
r43347 | commandline(ui, b'svnadmin').run0(b'create', path) | ||
Patrick Mezard
|
r17247 | created = path | ||
path = util.normpath(path) | ||||
Augie Fackler
|
r43347 | if not path.startswith(b'/'): | ||
path = b'/' + path | ||||
path = b'file://' + path | ||||
Patrick Mezard
|
r5535 | |||
Augie Fackler
|
r43346 | wcpath = os.path.join( | ||
Augie Fackler
|
r43347 | encoding.getcwd(), os.path.basename(path) + b'-wc' | ||
Augie Fackler
|
r43346 | ) | ||
ui.status( | ||||
Augie Fackler
|
r43347 | _(b"initializing svn working copy '%s'\n") | ||
Augie Fackler
|
r43346 | % os.path.basename(wcpath) | ||
) | ||||
Augie Fackler
|
r43347 | self.run0(b'checkout', path, wcpath) | ||
Bryan O'Sullivan
|
r5513 | |||
self.wc = wcpath | ||||
Pierre-Yves David
|
r31246 | self.opener = vfsmod.vfs(self.wc) | ||
self.wopener = vfsmod.vfs(self.wc) | ||||
Augie Fackler
|
r43347 | self.childmap = mapfile(ui, self.join(b'hg-childmap')) | ||
Jordi Gutiérrez Hermoso
|
r24306 | if util.checkexec(self.wc): | ||
self.is_exec = util.isexec | ||||
else: | ||||
self.is_exec = None | ||||
Bryan O'Sullivan
|
r5513 | |||
if created: | ||||
Nikita Slyusarev
|
r47129 | prop_actions_allowed = [ | ||
(b'M', b'svn:log'), | ||||
(b'A', b'hg:convert-branch'), | ||||
(b'A', b'hg:convert-rev'), | ||||
] | ||||
if self.ui.configbool( | ||||
b'convert', b'svn.dangerous-set-commit-dates' | ||||
): | ||||
prop_actions_allowed.append((b'M', b'svn:date')) | ||||
Augie Fackler
|
r43347 | hook = os.path.join(created, b'hooks', b'pre-revprop-change') | ||
fp = open(hook, b'wb') | ||||
Nikita Slyusarev
|
r47129 | fp.write(gen_pre_revprop_change_hook(prop_actions_allowed)) | ||
Bryan O'Sullivan
|
r5513 | fp.close() | ||
Adrian Buehlmann
|
r14232 | util.setflags(hook, False, True) | ||
Bryan O'Sullivan
|
r5513 | |||
Augie Fackler
|
r43347 | output = self.run0(b'info') | ||
Patrick Mezard
|
r13530 | self.uuid = self.uuid_re.search(output).group(1).strip() | ||
Bryan O'Sullivan
|
r5554 | |||
Bryan O'Sullivan
|
r5513 | def wjoin(self, *names): | ||
return os.path.join(self.wc, *names) | ||||
Patrick Mezard
|
r16511 | @propertycache | ||
def manifest(self): | ||||
# As of svn 1.7, the "add" command fails when receiving | ||||
# already tracked entries, so we have to track and filter them | ||||
# ourselves. | ||||
m = set() | ||||
Augie Fackler
|
r43347 | output = self.run0(b'ls', recursive=True, xml=True) | ||
Patrick Mezard
|
r16511 | doc = xml.dom.minidom.parseString(output) | ||
Augie Fackler
|
r43906 | for e in doc.getElementsByTagName('entry'): | ||
Patrick Mezard
|
r16511 | for n in e.childNodes: | ||
Augie Fackler
|
r43906 | if n.nodeType != n.ELEMENT_NODE or n.tagName != 'name': | ||
Patrick Mezard
|
r16511 | continue | ||
Augie Fackler
|
r43906 | name = ''.join( | ||
Augie Fackler
|
r43346 | c.data for c in n.childNodes if c.nodeType == c.TEXT_NODE | ||
) | ||||
Patrick Mezard
|
r16511 | # Entries are compared with names coming from | ||
# mercurial, so bytes with undefined encoding. Our | ||||
# best bet is to assume they are in local | ||||
# encoding. They will be passed to command line calls | ||||
# later anyway, so they better be. | ||||
Yuya Nishihara
|
r31447 | m.add(encoding.unitolocal(name)) | ||
Patrick Mezard
|
r16511 | break | ||
return m | ||||
Bryan O'Sullivan
|
r5513 | def putfile(self, filename, flags, data): | ||
Augie Fackler
|
r43347 | if b'l' in flags: | ||
Bryan O'Sullivan
|
r5513 | self.wopener.symlink(data, filename) | ||
else: | ||||
try: | ||||
if os.path.islink(self.wjoin(filename)): | ||||
os.unlink(filename) | ||||
except OSError: | ||||
pass | ||||
Nikita Slyusarev
|
r41766 | |||
if self.is_exec: | ||||
# We need to check executability of the file before the change, | ||||
# because `vfs.write` is able to reset exec bit. | ||||
wasexec = False | ||||
if os.path.exists(self.wjoin(filename)): | ||||
wasexec = self.is_exec(self.wjoin(filename)) | ||||
Dan Villiom Podlaski Christiansen
|
r14168 | self.wopener.write(filename, data) | ||
Patrick Mezard
|
r5536 | |||
if self.is_exec: | ||||
Nikita Slyusarev
|
r41766 | if wasexec: | ||
Augie Fackler
|
r43347 | if b'x' not in flags: | ||
Mads Kiilerich
|
r17031 | self.delexec.append(filename) | ||
else: | ||||
Augie Fackler
|
r43347 | if b'x' in flags: | ||
Mads Kiilerich
|
r17031 | self.setexec.append(filename) | ||
Augie Fackler
|
r43347 | util.setflags(self.wjoin(filename), False, b'x' in flags) | ||
Maxim Dounin
|
r5698 | |||
def _copyfile(self, source, dest): | ||||
Bryan O'Sullivan
|
r5513 | # SVN's copy command pukes if the destination file exists, but | ||
# our copyfile method expects to record a copy that has | ||||
# already occurred. Cross the semantic gap. | ||||
wdest = self.wjoin(dest) | ||||
Patrick Mezard
|
r12343 | exists = os.path.lexists(wdest) | ||
Bryan O'Sullivan
|
r5513 | if exists: | ||
Yuya Nishihara
|
r38182 | fd, tempname = pycompat.mkstemp( | ||
Augie Fackler
|
r43347 | prefix=b'hg-copy-', dir=os.path.dirname(wdest) | ||
Augie Fackler
|
r43346 | ) | ||
Bryan O'Sullivan
|
r5513 | os.close(fd) | ||
os.unlink(tempname) | ||||
os.rename(wdest, tempname) | ||||
try: | ||||
Augie Fackler
|
r43347 | self.run0(b'copy', source, dest) | ||
Bryan O'Sullivan
|
r5513 | finally: | ||
Patrick Mezard
|
r16511 | self.manifest.add(dest) | ||
Bryan O'Sullivan
|
r5513 | if exists: | ||
try: | ||||
os.unlink(wdest) | ||||
except OSError: | ||||
pass | ||||
os.rename(tempname, wdest) | ||||
def dirs_of(self, files): | ||||
Martin Geisler
|
r8150 | dirs = set() | ||
Bryan O'Sullivan
|
r5513 | for f in files: | ||
if os.path.isdir(self.wjoin(f)): | ||||
dirs.add(f) | ||||
Yuya Nishihara
|
r30605 | i = len(f) | ||
Augie Fackler
|
r43347 | for i in iter(lambda: f.rfind(b'/', 0, i), -1): | ||
Bryan O'Sullivan
|
r5513 | dirs.add(f[:i]) | ||
return dirs | ||||
Maxim Dounin
|
r5698 | def add_dirs(self, files): | ||
Augie Fackler
|
r43346 | add_dirs = [ | ||
d for d in sorted(self.dirs_of(files)) if d not in self.manifest | ||||
] | ||||
Bryan O'Sullivan
|
r5513 | if add_dirs: | ||
Patrick Mezard
|
r16511 | self.manifest.update(add_dirs) | ||
Augie Fackler
|
r43347 | self.xargs(add_dirs, b'add', non_recursive=True, quiet=True) | ||
Maxim Dounin
|
r5698 | return add_dirs | ||
def add_files(self, files): | ||||
Patrick Mezard
|
r16511 | files = [f for f in files if f not in self.manifest] | ||
Bryan O'Sullivan
|
r5513 | if files: | ||
Patrick Mezard
|
r16511 | self.manifest.update(files) | ||
Augie Fackler
|
r43347 | self.xargs(files, b'add', quiet=True) | ||
Maxim Dounin
|
r5698 | return files | ||
Thomas Arendsen Hein
|
r5760 | |||
Bryan O'Sullivan
|
r5513 | def addchild(self, parent, child): | ||
self.childmap[parent] = child | ||||
Bryan O'Sullivan
|
r5554 | def revid(self, rev): | ||
Augie Fackler
|
r43347 | return b"svn:%s@%s" % (self.uuid, rev) | ||
Maxim Dounin
|
r5698 | |||
Augie Fackler
|
r43346 | def putcommit( | ||
self, files, copies, parents, commit, source, revmap, full, cleanp2 | ||||
): | ||||
Patrick Mezard
|
r15605 | for parent in parents: | ||
try: | ||||
return self.revid(self.childmap[parent]) | ||||
except KeyError: | ||||
pass | ||||
Patrick Mezard
|
r6716 | # Apply changes to working copy | ||
for f, v in files: | ||||
Mads Kiilerich
|
r22296 | data, mode = source.getfile(f, v) | ||
if data is None: | ||||
Patrick Mezard
|
r6716 | self.delete.append(f) | ||
else: | ||||
Patrick Mezard
|
r11134 | self.putfile(f, mode, data) | ||
Patrick Mezard
|
r6716 | if f in copies: | ||
self.copies.append([copies[f], f]) | ||||
Mads Kiilerich
|
r22300 | if full: | ||
self.delete.extend(sorted(self.manifest.difference(files))) | ||||
Patrick Mezard
|
r6716 | files = [f[0] for f in files] | ||
Martin Geisler
|
r8150 | entries = set(self.delete) | ||
files = frozenset(files) | ||||
Maxim Dounin
|
r5698 | entries.update(self.add_dirs(files.difference(entries))) | ||
if self.copies: | ||||
for s, d in self.copies: | ||||
self._copyfile(s, d) | ||||
self.copies = [] | ||||
Bryan O'Sullivan
|
r5513 | if self.delete: | ||
Augie Fackler
|
r43347 | self.xargs(self.delete, b'delete') | ||
Patrick Mezard
|
r16511 | for f in self.delete: | ||
self.manifest.remove(f) | ||||
Bryan O'Sullivan
|
r5513 | self.delete = [] | ||
entries.update(self.add_files(files.difference(entries))) | ||||
Maxim Dounin
|
r5698 | if self.delexec: | ||
Augie Fackler
|
r43347 | self.xargs(self.delexec, b'propdel', b'svn:executable') | ||
Maxim Dounin
|
r5698 | self.delexec = [] | ||
if self.setexec: | ||||
Augie Fackler
|
r43347 | self.xargs(self.setexec, b'propset', b'svn:executable', b'*') | ||
Maxim Dounin
|
r5698 | self.setexec = [] | ||
Augie Fackler
|
r43347 | fd, messagefile = pycompat.mkstemp(prefix=b'hg-convert-') | ||
Augie Fackler
|
r43906 | fp = os.fdopen(fd, 'wb') | ||
Yuya Nishihara
|
r36166 | fp.write(util.tonativeeol(commit.desc)) | ||
Bryan O'Sullivan
|
r5513 | fp.close() | ||
try: | ||||
Augie Fackler
|
r43346 | output = self.run0( | ||
Augie Fackler
|
r43347 | b'commit', | ||
Augie Fackler
|
r43346 | username=stringutil.shortuser(commit.author), | ||
file=messagefile, | ||||
Augie Fackler
|
r43347 | encoding=b'utf-8', | ||
Augie Fackler
|
r43346 | ) | ||
Bryan O'Sullivan
|
r5513 | try: | ||
rev = self.commit_re.search(output).group(1) | ||||
except AttributeError: | ||||
Nikita Slyusarev
|
r41765 | if not files: | ||
Augie Fackler
|
r43347 | return parents[0] if parents else b'None' | ||
self.ui.warn(_(b'unexpected svn output:\n')) | ||||
Bryan O'Sullivan
|
r5513 | self.ui.warn(output) | ||
Augie Fackler
|
r43347 | raise error.Abort(_(b'unable to cope with svn output')) | ||
Bryan O'Sullivan
|
r5513 | if commit.rev: | ||
Augie Fackler
|
r43346 | self.run( | ||
Augie Fackler
|
r43347 | b'propset', | ||
b'hg:convert-rev', | ||||
Augie Fackler
|
r43346 | commit.rev, | ||
revprop=True, | ||||
revision=rev, | ||||
) | ||||
Augie Fackler
|
r43347 | if commit.branch and commit.branch != b'default': | ||
Augie Fackler
|
r43346 | self.run( | ||
Augie Fackler
|
r43347 | b'propset', | ||
b'hg:convert-branch', | ||||
Augie Fackler
|
r43346 | commit.branch, | ||
revprop=True, | ||||
revision=rev, | ||||
) | ||||
Nikita Slyusarev
|
r47129 | |||
if self.ui.configbool( | ||||
b'convert', b'svn.dangerous-set-commit-dates' | ||||
): | ||||
# Subverson always uses UTC to represent date and time | ||||
date = dateutil.parsedate(commit.date) | ||||
date = (date[0], 0) | ||||
# The only way to set date and time for svn commit is to use propset after commit is done | ||||
self.run( | ||||
b'propset', | ||||
b'svn:date', | ||||
formatsvndate(date), | ||||
revprop=True, | ||||
revision=rev, | ||||
) | ||||
Bryan O'Sullivan
|
r5513 | for parent in parents: | ||
self.addchild(parent, rev) | ||||
Bryan O'Sullivan
|
r5554 | return self.revid(rev) | ||
Bryan O'Sullivan
|
r5513 | finally: | ||
os.unlink(messagefile) | ||||
def puttags(self, tags): | ||||
Augie Fackler
|
r43347 | self.ui.warn(_(b'writing Subversion tags is not yet implemented\n')) | ||
Daniel J. Lauk
|
r11778 | return None, None | ||
Patrick Mezard
|
r16106 | |||
Mads Kiilerich
|
r21635 | def hascommitfrommap(self, rev): | ||
# We trust that revisions referenced in a map still is present | ||||
# TODO: implement something better if necessary and feasible | ||||
return True | ||||
Mads Kiilerich
|
r21634 | def hascommitforsplicemap(self, rev): | ||
Patrick Mezard
|
r16106 | # This is not correct as one can convert to an existing subversion | ||
# repository and childmap would not list all revisions. Too bad. | ||||
if rev in self.childmap: | ||||
return True | ||||
Augie Fackler
|
r43346 | raise error.Abort( | ||
_( | ||||
Augie Fackler
|
r43347 | b'splice map revision %s not found in subversion ' | ||
b'child map (revision lookups are not implemented)' | ||||
Augie Fackler
|
r43346 | ) | ||
% rev | ||||
) | ||||