changelog.py
349 lines
| 11.7 KiB
| text/x-python
|
PythonLexer
/ mercurial / changelog.py
mpm@selenic.com
|
r1095 | # changelog.py - changelog class for mercurial | ||
mpm@selenic.com
|
r1089 | # | ||
Thomas Arendsen Hein
|
r4635 | # Copyright 2005-2007 Matt Mackall <mpm@selenic.com> | ||
mpm@selenic.com
|
r1089 | # | ||
Martin Geisler
|
r8225 | # This software may be used and distributed according to the terms of the | ||
Matt Mackall
|
r10263 | # GNU General Public License version 2 or any later version. | ||
mpm@selenic.com
|
r1089 | |||
Joel Rosdahl
|
r6211 | from node import bin, hex, nullid | ||
Benoit Boissinot
|
r7035 | from i18n import _ | ||
Matt Mackall
|
r7948 | import util, error, revlog, encoding | ||
mpm@selenic.com
|
r1089 | |||
Matt Mackall
|
r16267 | _defaultextra = {'branch': 'default'} | ||
Benoit Boissinot
|
r3232 | def _string_escape(text): | ||
""" | ||||
>>> d = {'nl': chr(10), 'bs': chr(92), 'cr': chr(13), 'nul': chr(0)} | ||||
>>> s = "ab%(nl)scd%(bs)s%(bs)sn%(nul)sab%(cr)scd%(bs)s%(nl)s" % d | ||||
>>> s | ||||
'ab\\ncd\\\\\\\\n\\x00ab\\rcd\\\\\\n' | ||||
>>> res = _string_escape(s) | ||||
Matt Mackall
|
r5745 | >>> s == res.decode('string_escape') | ||
Benoit Boissinot
|
r3232 | True | ||
""" | ||||
# subset of the string_escape codec | ||||
text = text.replace('\\', '\\\\').replace('\n', '\\n').replace('\r', '\\r') | ||||
return text.replace('\0', '\\0') | ||||
Martin Geisler
|
r8443 | def decodeextra(text): | ||
Matt Mackall
|
r15661 | """ | ||
Mads Kiilerich
|
r18379 | >>> sorted(decodeextra(encodeextra({'foo': 'bar', 'baz': chr(0) + '2'}) | ||
... ).iteritems()) | ||||
[('baz', '\\x002'), ('branch', 'default'), ('foo', 'bar')] | ||||
>>> sorted(decodeextra(encodeextra({'foo': 'bar', | ||||
... 'baz': chr(92) + chr(0) + '2'}) | ||||
... ).iteritems()) | ||||
[('baz', '\\\\\\x002'), ('branch', 'default'), ('foo', 'bar')] | ||||
Matt Mackall
|
r15661 | """ | ||
Matt Mackall
|
r16267 | extra = _defaultextra.copy() | ||
Martin Geisler
|
r8443 | for l in text.split('\0'): | ||
if l: | ||||
Matt Mackall
|
r15661 | if '\\0' in l: | ||
# fix up \0 without getting into trouble with \\0 | ||||
l = l.replace('\\\\', '\\\\\n') | ||||
l = l.replace('\\0', '\0') | ||||
l = l.replace('\n', '') | ||||
Martin Geisler
|
r8443 | k, v = l.decode('string_escape').split(':', 1) | ||
extra[k] = v | ||||
return extra | ||||
def encodeextra(d): | ||||
# keys must be sorted to produce a deterministic changelog entry | ||||
items = [_string_escape('%s:%s' % (k, d[k])) for k in sorted(d)] | ||||
return "\0".join(items) | ||||
Pierre-Yves David
|
r17810 | def stripdesc(desc): | ||
"""strip trailing whitespace and leading and trailing empty lines""" | ||||
return '\n'.join([l.rstrip() for l in desc.splitlines()]).strip('\n') | ||||
Benoit Boissinot
|
r8778 | class appender(object): | ||
timeless
|
r7807 | '''the changelog index must be updated last on disk, so we use this class | ||
Matt Mackall
|
r4261 | to delay writes to it''' | ||
def __init__(self, fp, buf): | ||||
self.data = buf | ||||
self.fp = fp | ||||
self.offset = fp.tell() | ||||
self.size = util.fstat(fp).st_size | ||||
def end(self): | ||||
return self.size + len("".join(self.data)) | ||||
def tell(self): | ||||
return self.offset | ||||
def flush(self): | ||||
pass | ||||
def close(self): | ||||
Benoit Boissinot
|
r4961 | self.fp.close() | ||
Matt Mackall
|
r4261 | |||
def seek(self, offset, whence=0): | ||||
'''virtual file offset spans real file and data''' | ||||
if whence == 0: | ||||
self.offset = offset | ||||
elif whence == 1: | ||||
self.offset += offset | ||||
elif whence == 2: | ||||
self.offset = self.end() + offset | ||||
if self.offset < self.size: | ||||
self.fp.seek(self.offset) | ||||
def read(self, count=-1): | ||||
'''only trick here is reads that span real file and data''' | ||||
ret = "" | ||||
if self.offset < self.size: | ||||
s = self.fp.read(count) | ||||
ret = s | ||||
self.offset += len(s) | ||||
if count > 0: | ||||
count -= len(s) | ||||
if count != 0: | ||||
doff = self.offset - self.size | ||||
self.data.insert(0, "".join(self.data)) | ||||
del self.data[1:] | ||||
Matt Mackall
|
r10282 | s = self.data[0][doff:doff + count] | ||
Matt Mackall
|
r4261 | self.offset += len(s) | ||
ret += s | ||||
return ret | ||||
def write(self, s): | ||||
Matt Mackall
|
r5450 | self.data.append(str(s)) | ||
Matt Mackall
|
r4261 | self.offset += len(s) | ||
Matt Mackall
|
r9166 | def delayopener(opener, target, divert, buf): | ||
def o(name, mode='r'): | ||||
if name != target: | ||||
return opener(name, mode) | ||||
if divert: | ||||
return opener(name + ".a", mode.replace('a', 'w')) | ||||
# otherwise, divert to memory | ||||
return appender(opener(name, mode), buf) | ||||
return o | ||||
Matt Mackall
|
r7634 | class changelog(revlog.revlog): | ||
Matt Mackall
|
r4258 | def __init__(self, opener): | ||
Matt Mackall
|
r9165 | revlog.revlog.__init__(self, opener, "00changelog.i") | ||
Sune Foldager
|
r14334 | if self._initempty: | ||
# changelogs don't benefit from generaldelta | ||||
self.version &= ~revlog.REVLOGGENERALDELTA | ||||
self._generaldelta = False | ||||
Matt Mackall
|
r8644 | self._realopener = opener | ||
self._delayed = False | ||||
Matt Mackall
|
r9163 | self._divert = False | ||
Pierre-Yves David
|
r18231 | self.filteredrevs = frozenset() | ||
Pierre-Yves David
|
r17677 | |||
def tip(self): | ||||
"""filtered version of revlog.tip""" | ||||
for i in xrange(len(self) -1, -2, -1): | ||||
if i not in self.filteredrevs: | ||||
return self.node(i) | ||||
def __iter__(self): | ||||
"""filtered version of revlog.__iter__""" | ||||
Durham Goode
|
r17951 | if len(self.filteredrevs) == 0: | ||
return revlog.revlog.__iter__(self) | ||||
def filterediter(): | ||||
for i in xrange(len(self)): | ||||
if i not in self.filteredrevs: | ||||
yield i | ||||
return filterediter() | ||||
Pierre-Yves David
|
r17677 | |||
def revs(self, start=0, stop=None): | ||||
"""filtered version of revlog.revs""" | ||||
for i in super(changelog, self).revs(start, stop): | ||||
if i not in self.filteredrevs: | ||||
yield i | ||||
@util.propertycache | ||||
def nodemap(self): | ||||
# XXX need filtering too | ||||
self.rev(self.node(0)) | ||||
return self._nodecache | ||||
def hasnode(self, node): | ||||
"""filtered version of revlog.hasnode""" | ||||
try: | ||||
i = self.rev(node) | ||||
return i not in self.filteredrevs | ||||
except KeyError: | ||||
return False | ||||
def headrevs(self): | ||||
if self.filteredrevs: | ||||
# XXX we should fix and use the C version | ||||
return self._headrevs() | ||||
return super(changelog, self).headrevs() | ||||
def strip(self, *args, **kwargs): | ||||
# XXX make something better than assert | ||||
# We can't expect proper strip behavior if we are filtered. | ||||
assert not self.filteredrevs | ||||
super(changelog, self).strip(*args, **kwargs) | ||||
def rev(self, node): | ||||
"""filtered version of revlog.rev""" | ||||
r = super(changelog, self).rev(node) | ||||
if r in self.filteredrevs: | ||||
raise error.LookupError(node, self.indexfile, _('no node')) | ||||
return r | ||||
def node(self, rev): | ||||
"""filtered version of revlog.node""" | ||||
if rev in self.filteredrevs: | ||||
raise IndexError(rev) | ||||
return super(changelog, self).node(rev) | ||||
def linkrev(self, rev): | ||||
"""filtered version of revlog.linkrev""" | ||||
if rev in self.filteredrevs: | ||||
raise IndexError(rev) | ||||
return super(changelog, self).linkrev(rev) | ||||
def parentrevs(self, rev): | ||||
"""filtered version of revlog.parentrevs""" | ||||
if rev in self.filteredrevs: | ||||
raise IndexError(rev) | ||||
return super(changelog, self).parentrevs(rev) | ||||
def flags(self, rev): | ||||
"""filtered version of revlog.flags""" | ||||
if rev in self.filteredrevs: | ||||
raise IndexError(rev) | ||||
return super(changelog, self).flags(rev) | ||||
mpm@selenic.com
|
r1089 | |||
Matt Mackall
|
r4261 | def delayupdate(self): | ||
"delay visibility of index updates to other readers" | ||||
Matt Mackall
|
r8644 | self._delayed = True | ||
Matt Mackall
|
r9163 | self._divert = (len(self) == 0) | ||
Matt Mackall
|
r4261 | self._delaybuf = [] | ||
Matt Mackall
|
r9166 | self.opener = delayopener(self._realopener, self.indexfile, | ||
self._divert, self._delaybuf) | ||||
Matt Mackall
|
r4261 | |||
def finalize(self, tr): | ||||
"finalize index updates" | ||||
Matt Mackall
|
r8644 | self._delayed = False | ||
Matt Mackall
|
r9165 | self.opener = self._realopener | ||
Matt Mackall
|
r4269 | # move redirected index data back into place | ||
Matt Mackall
|
r9164 | if self._divert: | ||
Zachary Gramana
|
r14207 | nfile = self.opener(self.indexfile + ".a") | ||
n = nfile.name | ||||
nfile.close() | ||||
Matt Mackall
|
r9166 | util.rename(n, n[:-2]) | ||
Matt Mackall
|
r4269 | elif self._delaybuf: | ||
Matt Mackall
|
r4261 | fp = self.opener(self.indexfile, 'a') | ||
fp.write("".join(self._delaybuf)) | ||||
fp.close() | ||||
Matt Mackall
|
r7787 | self._delaybuf = [] | ||
Matt Mackall
|
r4269 | # split when we're done | ||
Matt Mackall
|
r4261 | self.checkinlinesize(tr) | ||
Matt Mackall
|
r7787 | def readpending(self, file): | ||
r = revlog.revlog(self.opener, file) | ||||
self.index = r.index | ||||
self.nodemap = r.nodemap | ||||
Bryan O'Sullivan
|
r16619 | self._nodecache = r._nodecache | ||
Matt Mackall
|
r7787 | self._chunkcache = r._chunkcache | ||
def writepending(self): | ||||
"create a file containing the unfinalized state for pretxnchangegroup" | ||||
if self._delaybuf: | ||||
# make a temporary copy of the index | ||||
fp1 = self._realopener(self.indexfile) | ||||
fp2 = self._realopener(self.indexfile + ".a", "w") | ||||
fp2.write(fp1.read()) | ||||
# add pending data | ||||
fp2.write("".join(self._delaybuf)) | ||||
fp2.close() | ||||
# switch modes so finalize can simply rename | ||||
self._delaybuf = [] | ||||
Matt Mackall
|
r9164 | self._divert = True | ||
Matt Mackall
|
r7787 | |||
Matt Mackall
|
r9164 | if self._divert: | ||
Matt Mackall
|
r7787 | return True | ||
return False | ||||
Matt Mackall
|
r4261 | def checkinlinesize(self, tr, fp=None): | ||
Matt Mackall
|
r9165 | if not self._delayed: | ||
revlog.revlog.checkinlinesize(self, tr, fp) | ||||
Matt Mackall
|
r4261 | |||
Matt Mackall
|
r5744 | def read(self, node): | ||
Benoit Boissinot
|
r3077 | """ | ||
format used: | ||||
Benoit Boissinot
|
r3233 | nodeid\n : manifest node in ascii | ||
user\n : user, no \n or \r allowed | ||||
time tz extra\n : date (time is int or float, timezone is int) | ||||
Mads Kiilerich
|
r17424 | : extra is metadata, encoded and separated by '\0' | ||
Benoit Boissinot
|
r3233 | : older versions ignore it | ||
files\n\n : files modified by the cset, no \n or \r allowed | ||||
(.*) : comment (free text, ideally utf-8) | ||||
changelog v0 doesn't use extra | ||||
Benoit Boissinot
|
r3077 | """ | ||
Matt Mackall
|
r5744 | text = self.revision(node) | ||
mpm@selenic.com
|
r1089 | if not text: | ||
Matt Mackall
|
r16267 | return (nullid, "", (0, 0), [], "", _defaultextra) | ||
mpm@selenic.com
|
r1089 | last = text.index("\n\n") | ||
Matt Mackall
|
r7948 | desc = encoding.tolocal(text[last + 2:]) | ||
Benoit Boissinot
|
r3233 | l = text[:last].split('\n') | ||
mpm@selenic.com
|
r1089 | manifest = bin(l[0]) | ||
Matt Mackall
|
r7948 | user = encoding.tolocal(l[1]) | ||
Benoit Boissinot
|
r3233 | |||
Matt Mackall
|
r16267 | tdata = l[2].split(' ', 2) | ||
if len(tdata) != 3: | ||||
time = float(tdata[0]) | ||||
Benoit Boissinot
|
r3233 | try: | ||
# various tools did silly things with the time zone field. | ||||
Matt Mackall
|
r16267 | timezone = int(tdata[1]) | ||
Idan Kamara
|
r14004 | except ValueError: | ||
Benoit Boissinot
|
r3233 | timezone = 0 | ||
Matt Mackall
|
r16267 | extra = _defaultextra | ||
Benoit Boissinot
|
r3233 | else: | ||
Matt Mackall
|
r16267 | time, timezone = float(tdata[0]), int(tdata[1]) | ||
extra = decodeextra(tdata[2]) | ||||
mpm@selenic.com
|
r1089 | files = l[3:] | ||
Benoit Boissinot
|
r3233 | return (manifest, user, (time, timezone), files, desc, extra) | ||
mpm@selenic.com
|
r1089 | |||
Martin Geisler
|
r8422 | def add(self, manifest, files, desc, transaction, p1, p2, | ||
Benoit Boissinot
|
r9677 | user, date=None, extra=None): | ||
Martin Geisler
|
r14379 | # Convert to UTF-8 encoded bytestrings as the very first | ||
# thing: calling any method on a localstr object will turn it | ||||
# into a str object and the cached UTF-8 string is thus lost. | ||||
user, desc = encoding.fromlocal(user), encoding.fromlocal(desc) | ||||
Benoit Boissinot
|
r7035 | user = user.strip() | ||
Martin Geisler
|
r8424 | # An empty username or a username with a "\n" will make the | ||
# revision text contain two "\n\n" sequences -> corrupt | ||||
# repository since read cannot unpack the revision. | ||||
if not user: | ||||
raise error.RevlogError(_("empty username")) | ||||
Benoit Boissinot
|
r7035 | if "\n" in user: | ||
Matt Mackall
|
r7633 | raise error.RevlogError(_("username %s contains a newline") | ||
% repr(user)) | ||||
Matt Mackall
|
r8499 | |||
Pierre-Yves David
|
r17810 | desc = stripdesc(desc) | ||
Matt Mackall
|
r8499 | |||
Bryan O'Sullivan
|
r1195 | if date: | ||
Benoit Boissinot
|
r2523 | parseddate = "%d %d" % util.parsedate(date) | ||
Bryan O'Sullivan
|
r1195 | else: | ||
Jose M. Prieto
|
r2522 | parseddate = "%d %d" % util.makedate() | ||
Wagner Bruna
|
r10417 | if extra: | ||
branch = extra.get("branch") | ||||
if branch in ("default", ""): | ||||
del extra["branch"] | ||||
elif branch in (".", "null", "tip"): | ||||
raise error.RevlogError(_('the name \'%s\' is reserved') | ||||
% branch) | ||||
Benoit Boissinot
|
r3233 | if extra: | ||
Martin Geisler
|
r8443 | extra = encodeextra(extra) | ||
Benoit Boissinot
|
r3233 | parseddate = "%s %s" % (parseddate, extra) | ||
Matt Mackall
|
r8209 | l = [hex(manifest), user, parseddate] + sorted(files) + ["", desc] | ||
mpm@selenic.com
|
r1089 | text = "\n".join(l) | ||
Matt Mackall
|
r6750 | return self.addrevision(text, transaction, len(self), p1, p2) | ||
Pierre-Yves David
|
r18306 | |||
def branch(self, rev): | ||||
"""return the branch of a revision | ||||
Mads Kiilerich
|
r18308 | This function exists because creating a changectx object | ||
just to access this is costly.""" | ||||
Pierre-Yves David
|
r18306 | return encoding.tolocal(self.read(rev)[5].get("branch")) | ||