store.py
749 lines
| 21.6 KiB
| text/x-python
|
PythonLexer
/ mercurial / store.py
Adrian Buehlmann
|
r6839 | # store.py - repository store handling for Mercurial | ||
# | ||||
# Copyright 2008 Matt Mackall <mpm@selenic.com> | ||||
# | ||||
Martin Geisler
|
r8225 | # This software may be used and distributed according to the terms of the | ||
Matt Mackall
|
r10263 | # GNU General Public License version 2 or any later version. | ||
Adrian Buehlmann
|
r6839 | |||
Gregory Szorc
|
r27480 | from __future__ import absolute_import | ||
import errno | ||||
Pulkit Goyal
|
r42144 | import functools | ||
Gregory Szorc
|
r27480 | import os | ||
import stat | ||||
from .i18n import _ | ||||
Gregory Szorc
|
r43359 | from .pycompat import getattr | ||
Joerg Sonnenberger
|
r46729 | from .node import hex | ||
Gregory Szorc
|
r27480 | from . import ( | ||
Augie Fackler
|
r43175 | changelog, | ||
Gregory Szorc
|
r27480 | error, | ||
Augie Fackler
|
r43175 | manifest, | ||
Yuya Nishihara
|
r32372 | policy, | ||
Mateusz Kwapich
|
r30077 | pycompat, | ||
Gregory Szorc
|
r27480 | util, | ||
Pierre-Yves David
|
r31234 | vfs as vfsmod, | ||
Gregory Szorc
|
r27480 | ) | ||
Augie Fackler
|
r44517 | from .utils import hashutil | ||
Adrian Buehlmann
|
r6840 | |||
Augie Fackler
|
# module chosen by the import policy; encodedir, lowerencode and pathencode
# are looked up on it further down, each with a pure-Python fallback
parsers = policy.importmod('parsers')

# how many bytes should be read from fncache in one read
# This is done to avoid loading large fncache files into memory at once
fncache_chunksize = 10 ** 6
Yuya Nishihara
|
r32372 | |||
Augie Fackler
|
r43346 | |||
Pulkit Goyal
|
r40529 | def _matchtrackedpath(path, matcher): | ||
"""parses a fncache entry and returns whether the entry is tracking a path | ||||
matched by matcher or not. | ||||
If matcher is None, returns True""" | ||||
if matcher is None: | ||||
return True | ||||
path = decodedir(path) | ||||
Augie Fackler
|
r43347 | if path.startswith(b'data/'): | ||
return matcher(path[len(b'data/') : -len(b'.i')]) | ||||
elif path.startswith(b'meta/'): | ||||
return matcher.visitdir(path[len(b'meta/') : -len(b'/00manifest.i')]) | ||||
Pulkit Goyal
|
r40529 | |||
Augie Fackler
|
r43347 | raise error.ProgrammingError(b"cannot decode path %s" % path) | ||
Pulkit Goyal
|
r40658 | |||
Augie Fackler
|
r43346 | |||
Benoit Boissinot
|
r8531 | # This avoids a collision between a file named foo and a dir named | ||
# foo.i or foo.d | ||||
Adrian Buehlmann
|
r17607 | def _encodedir(path): | ||
Augie Fackler
|
r46554 | """ | ||
Yuya Nishihara
|
r34133 | >>> _encodedir(b'data/foo.i') | ||
Adrian Buehlmann
|
r13949 | 'data/foo.i' | ||
Yuya Nishihara
|
r34133 | >>> _encodedir(b'data/foo.i/bla.i') | ||
Adrian Buehlmann
|
r13949 | 'data/foo.i.hg/bla.i' | ||
Yuya Nishihara
|
r34133 | >>> _encodedir(b'data/foo.i.hg/bla.i') | ||
Adrian Buehlmann
|
r13949 | 'data/foo.i.hg.hg/bla.i' | ||
Yuya Nishihara
|
r34133 | >>> _encodedir(b'data/foo.i\\ndata/foo.i/bla.i\\ndata/foo.i.hg/bla.i\\n') | ||
Adrian Buehlmann
|
r17605 | 'data/foo.i\\ndata/foo.i.hg/bla.i\\ndata/foo.i.hg.hg/bla.i\\n' | ||
Augie Fackler
|
r46554 | """ | ||
Augie Fackler
|
r43346 | return ( | ||
Augie Fackler
|
r43347 | path.replace(b".hg/", b".hg.hg/") | ||
.replace(b".i/", b".i.hg/") | ||||
.replace(b".d/", b".d.hg/") | ||||
Augie Fackler
|
r43346 | ) | ||
Benoit Boissinot
|
r8531 | |||
Adrian Buehlmann
|
# use the parsers module's encodedir when it provides one, otherwise the
# pure-Python _encodedir
encodedir = getattr(parsers, 'encodedir', _encodedir)
Augie Fackler
|
r43346 | |||
Benoit Boissinot
|
def decodedir(path):
    """
    Strip the '.hg' that was appended to '.hg', '.i' and '.d' directories.

    >>> decodedir(b'data/foo.i')
    'data/foo.i'
    >>> decodedir(b'data/foo.i.hg/bla.i')
    'data/foo.i/bla.i'
    >>> decodedir(b'data/foo.i.hg.hg/bla.i')
    'data/foo.i.hg/bla.i'
    """
    # every escaped form contains '.hg/', so a path without it is untouched
    if b".hg/" in path:
        unescapes = (
            (b".d.hg/", b".d/"),
            (b".i.hg/", b".i/"),
            (b".hg.hg/", b".hg/"),
        )
        for escaped, plain in unescapes:
            path = path.replace(escaped, plain)
    return path
Benoit Boissinot
|
r8531 | |||
timeless
|
r29071 | def _reserved(): | ||
Augie Fackler
|
r46554 | """characters that are problematic for filesystems | ||
timeless
|
r29071 | |||
* ascii escapes (0..31) | ||||
* ascii hi (126..255) | ||||
* windows specials | ||||
these characters will be escaped by encodefunctions | ||||
Augie Fackler
|
r46554 | """ | ||
Mateusz Kwapich
|
r30076 | winreserved = [ord(x) for x in u'\\:*?"<>|'] | ||
timeless
|
r29071 | for x in range(32): | ||
yield x | ||||
for x in range(126, 256): | ||||
yield x | ||||
for x in winreserved: | ||||
yield x | ||||
Augie Fackler
|
r43346 | |||
Adrian Buehlmann
|
def _buildencodefun():
    """
    Build the reversible filename encoder and the matching decoder.

    Returns an ``(encode, decode)`` pair.  Reserved bytes (see _reserved)
    become '~xx' with xx their two digit hex code; uppercase ASCII letters
    and '_' become '_' followed by the lowercased byte.  ``decode`` raises
    KeyError on input that is not a valid encoding.

    >>> enc, dec = _buildencodefun()

    >>> enc(b'nothing/special.txt')
    'nothing/special.txt'
    >>> dec(b'nothing/special.txt')
    'nothing/special.txt'

    >>> enc(b'HELLO')
    '_h_e_l_l_o'
    >>> dec(b'_h_e_l_l_o')
    'HELLO'

    >>> enc(b'hello:world?')
    'hello~3aworld~3f'
    >>> dec(b'hello~3aworld~3f')
    'hello:world?'

    >>> enc(b'the\\x07quick\\xADshot')
    'the~07quick~adshot'
    >>> dec(b'the~07quick~adshot')
    'the\\x07quick\\xadshot'
    """
    underscore = b'_'
    tobyte = pycompat.bytechr

    # start from the identity mapping for every byte value below 127 ...
    cmap = {}
    for code in range(127):
        cmap[tobyte(code)] = tobyte(code)
    # ... then override the reserved bytes with their '~xx' form ...
    for code in _reserved():
        cmap[tobyte(code)] = b"~%02x" % code
    # ... and finally the capitals and the escape character itself
    escaped = list(range(ord(b"A"), ord(b"Z") + 1))
    escaped.append(ord(underscore))
    for code in escaped:
        cmap[tobyte(code)] = underscore + tobyte(code).lower()

    # reverse table: encoded token (1 to 3 bytes long) -> original byte
    dmap = {token: plain for plain, token in pycompat.iteritems(cmap)}

    def _tokens(s):
        # try the shortest token first at each position
        pos = 0
        while pos < len(s):
            for width in pycompat.xrange(1, 4):
                token = s[pos : pos + width]
                if token in dmap:
                    yield dmap[token]
                    pos += width
                    break
            else:
                raise KeyError

    def encode(s):
        pieces = [cmap[s[c : c + 1]] for c in pycompat.xrange(len(s))]
        return b''.join(pieces)

    def decode(s):
        return b''.join(_tokens(s))

    return encode, decode
Adrian Buehlmann
|
r17608 | |||
# module-wide encoder/decoder pair, built once at import time
_encodefname, _decodefname = _buildencodefun()
Adrian Buehlmann
|
r6839 | |||
Augie Fackler
|
r43346 | |||
Adrian Buehlmann
|
def encodefilename(s):
    """
    Apply the directory escaping (encodedir) and then the filename encoding.

    >>> encodefilename(b'foo.i/bar.d/bla.hg/hi:world?/HELLO')
    'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o'
    """
    direncoded = encodedir(s)
    return _encodefname(direncoded)
Augie Fackler
|
r43346 | |||
Adrian Buehlmann
|
def decodefilename(s):
    """
    Undo encodefilename: decode the filename, then the directory escaping.

    >>> decodefilename(b'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o')
    'foo.i/bar.d/bla.hg/hi:world?/HELLO'
    """
    namedecoded = _decodefname(s)
    return decodedir(namedecoded)
Adrian Buehlmann
|
r6839 | |||
Augie Fackler
|
r43346 | |||
Adrian Buehlmann
|
def _buildlowerencodefun():
    """
    Build the lossy encoder: reserved bytes become '~xx', capitals are
    lowercased.

    >>> f = _buildlowerencodefun()
    >>> f(b'nothing/special.txt')
    'nothing/special.txt'
    >>> f(b'HELLO')
    'hello'
    >>> f(b'hello:world?')
    'hello~3aworld~3f'
    >>> f(b'the\\x07quick\\xADshot')
    'the~07quick~adshot'
    """
    tobyte = pycompat.bytechr

    # identity for every byte value below 127, then the overrides
    cmap = {}
    for code in pycompat.xrange(127):
        cmap[tobyte(code)] = tobyte(code)
    for code in _reserved():
        cmap[tobyte(code)] = b"~%02x" % code
    for code in range(ord(b"A"), ord(b"Z") + 1):
        cmap[tobyte(code)] = tobyte(code).lower()

    def lowerencode(s):
        pieces = [cmap[c] for c in pycompat.iterbytestr(s)]
        return b"".join(pieces)

    return lowerencode
Adrian Buehlmann
|
r7229 | |||
Augie Fackler
|
r43346 | |||
Bryan O'Sullivan
|
# use the parsers module's lowerencode when it provides one, otherwise
# build the pure-Python version
lowerencode = getattr(parsers, 'lowerencode', None) or _buildlowerencodefun()
Adrian Buehlmann
|
r7229 | |||
Adrian Buehlmann
|
r17570 | # Windows reserved names: con, prn, aux, nul, com1..com9, lpt1..lpt9 | ||
Augie Fackler
|
r43347 | _winres3 = (b'aux', b'con', b'prn', b'nul') # length 3 | ||
_winres4 = (b'com', b'lpt') # length 4 (with trailing 1..9) | ||||
Augie Fackler
|
r43346 | |||
Adrian Buehlmann
|
r12687 | def _auxencode(path, dotencode): | ||
Augie Fackler
|
r46554 | """ | ||
Adrian Buehlmann
|
r13949 | Encodes filenames containing names reserved by Windows or which end in | ||
period or space. Does not touch other single reserved characters c. | ||||
Specifically, c in '\\:*?"<>|' or ord(c) <= 31 are *not* encoded here. | ||||
Additionally encodes space or period at the beginning, if dotencode is | ||||
Adrian Buehlmann
|
r17569 | True. Parameter path is assumed to be all lowercase. | ||
A segment only needs encoding if a reserved name appears as a | ||||
basename (e.g. "aux", "aux.foo"). A directory or file named "foo.aux" | ||||
doesn't need encoding. | ||||
Adrian Buehlmann
|
r13949 | |||
Yuya Nishihara
|
r34133 | >>> s = b'.foo/aux.txt/txt.aux/con/prn/nul/foo.' | ||
>>> _auxencode(s.split(b'/'), True) | ||||
Adrian Buehlmann
|
r17574 | ['~2efoo', 'au~78.txt', 'txt.aux', 'co~6e', 'pr~6e', 'nu~6c', 'foo~2e'] | ||
Yuya Nishihara
|
r34133 | >>> s = b'.com1com2/lpt9.lpt4.lpt1/conprn/com0/lpt0/foo.' | ||
>>> _auxencode(s.split(b'/'), False) | ||||
Adrian Buehlmann
|
r17574 | ['.com1com2', 'lp~749.lpt4.lpt1', 'conprn', 'com0', 'lpt0', 'foo~2e'] | ||
Yuya Nishihara
|
r34133 | >>> _auxencode([b'foo. '], True) | ||
Adrian Buehlmann
|
r17574 | ['foo.~20'] | ||
Yuya Nishihara
|
r34133 | >>> _auxencode([b' .foo'], True) | ||
Adrian Buehlmann
|
r17574 | ['~20.foo'] | ||
Augie Fackler
|
r46554 | """ | ||
Adrian Buehlmann
|
r17589 | for i, n in enumerate(path): | ||
Adrian Buehlmann
|
r17572 | if not n: | ||
continue | ||||
Augie Fackler
|
r43347 | if dotencode and n[0] in b'. ': | ||
n = b"~%02x" % ord(n[0:1]) + n[1:] | ||||
Adrian Buehlmann
|
r17589 | path[i] = n | ||
Adrian Buehlmann
|
r17572 | else: | ||
Augie Fackler
|
r43347 | l = n.find(b'.') | ||
Adrian Buehlmann
|
r17572 | if l == -1: | ||
l = len(n) | ||||
Augie Fackler
|
r43346 | if (l == 3 and n[:3] in _winres3) or ( | ||
Augie Fackler
|
r43347 | l == 4 | ||
and n[3:4] <= b'9' | ||||
and n[3:4] >= b'1' | ||||
and n[:3] in _winres4 | ||||
Augie Fackler
|
r43346 | ): | ||
Adrian Buehlmann
|
r17572 | # encode third letter ('aux' -> 'au~78') | ||
Augie Fackler
|
r43347 | ec = b"~%02x" % ord(n[2:3]) | ||
Adrian Buehlmann
|
r17572 | n = n[0:2] + ec + n[3:] | ||
Adrian Buehlmann
|
r17589 | path[i] = n | ||
Augie Fackler
|
r43347 | if n[-1] in b'. ': | ||
Adrian Buehlmann
|
r17572 | # encode last period or space ('foo...' -> 'foo..~2e') | ||
Augie Fackler
|
r43347 | path[i] = n[:-1] + b"~%02x" % ord(n[-1:]) | ||
Adrian Buehlmann
|
r17589 | return path | ||
Adrian Buehlmann
|
r7229 | |||
Augie Fackler
|
r43346 | |||
Adrian Buehlmann
|
# longest path accepted from the reversible encoding; anything longer is
# replaced by the hashed encoding (see _hybridencode and _pathencode)
_maxstorepathlen = 120
# number of leading bytes kept from each directory level by _hashencode
_dirprefixlen = 8
# upper bound on the combined length of the shortened directories kept by
# _hashencode
_maxshortdirslen = 8 * (_dirprefixlen + 1) - 4
Bryan O'Sullivan
|
r17610 | |||
Augie Fackler
|
r43346 | |||
Bryan O'Sullivan
|
def _hashencode(path, dotencode):
    """Return the non-reversible hashed store path for ``path``.

    The result is ``dh/`` + shortened directories + filler + the hex sha1
    digest of ``path`` + the extension of the basename.  ``dotencode`` is
    passed on to _auxencode.
    """
    digest = hex(hashutil.sha1(path).digest())
    # skips prefix 'data/' or 'meta/'
    lowered = lowerencode(path[5:]).split(b'/')
    parts = _auxencode(lowered, dotencode)
    basename = parts[-1]
    ext = os.path.splitext(basename)[1]

    # keep a short prefix of each directory level, for as many levels as
    # fit within _maxshortdirslen (separators included)
    shortdirs = []
    usedlen = 0
    for part in parts[:-1]:
        short = part[:_dirprefixlen]
        if short[-1] in b'. ':
            # Windows can't access dirs ending in period or space
            short = short[:-1] + b'_'
        if usedlen == 0:
            needed = len(short)
        else:
            needed = usedlen + 1 + len(short)
        if needed > _maxshortdirslen:
            break
        shortdirs.append(short)
        usedlen = needed

    dirs = b'/'.join(shortdirs)
    if dirs:
        dirs += b'/'

    res = b'dh/' + dirs + digest + ext
    # use whatever room is left for the beginning of the basename
    spaceleft = _maxstorepathlen - len(res)
    if spaceleft > 0:
        res = b'dh/' + dirs + basename[:spaceleft] + digest + ext
    return res
Augie Fackler
|
r43346 | |||
Adrian Buehlmann
|
def _hybridencode(path, dotencode):
    """encodes path with a length limit

    Encodes all paths that begin with 'data/', according to the following.

    Default encoding (reversible):

    Encodes all uppercase letters 'X' as '_x'. All reserved or illegal
    characters are encoded as '~xx', where xx is the two digit hex code
    of the character (see encodefilename).
    Relevant path components consisting of Windows reserved filenames are
    masked by encoding the third character ('aux' -> 'au~78', see _auxencode).

    Hashed encoding (not reversible):

    If the default-encoded path is longer than _maxstorepathlen, a
    non-reversible hybrid hashing of the path is done instead.
    This encoding uses up to _dirprefixlen characters of all directory
    levels of the lowerencoded path, but not more levels than can fit into
    _maxshortdirslen.
    Then follows the filler followed by the sha digest of the full path.
    The filler is the beginning of the basename of the lowerencoded path
    (the basename is everything after the last path separator). The filler
    is as long as possible, filling in characters from the basename until
    the encoded path has _maxstorepathlen characters (or all chars of the
    basename have been taken).
    The extension (e.g. '.i' or '.d') is preserved.

    The string 'data/' at the beginning is replaced with 'dh/', if the hashed
    encoding was used.
    """
    direncoded = encodedir(path)
    segments = _encodefname(direncoded).split(b'/')
    default = b'/'.join(_auxencode(segments, dotencode))
    if len(default) <= _maxstorepathlen:
        return default
    # too long for the reversible form: fall back to the hashed one
    return _hashencode(direncoded, dotencode)
Augie Fackler
|
r43346 | |||
Adrian Buehlmann
|
def _pathencode(path):
    """Encode ``path`` like ``_hybridencode(path, True)``, with a shortcut.

    When the *unencoded* path is already longer than _maxstorepathlen the
    hashed encoding is used directly, without computing the default
    encoding first.
    """
    direncoded = encodedir(path)
    if len(path) <= _maxstorepathlen:
        segments = _encodefname(direncoded).split(b'/')
        default = b'/'.join(_auxencode(segments, True))
        if len(default) <= _maxstorepathlen:
            return default
    return _hashencode(direncoded, True)
Augie Fackler
|
r43346 | |||
Adrian Buehlmann
|
# use the parsers module's pathencode when it provides one, otherwise keep
# the pure-Python _pathencode defined just above
_pathencode = getattr(parsers, 'pathencode', _pathencode)
Augie Fackler
|
r43346 | |||
Adrian Buehlmann
|
def _plainhybridencode(f):
    """Hybrid-encode ``f`` with dotencode turned off."""
    return _hybridencode(f, dotencode=False)
Augie Fackler
|
r43346 | |||
FUJIWARA Katsunori
|
r17726 | def _calcmode(vfs): | ||
Matt Mackall
|
r6898 | try: | ||
# files in .hg/ will be created using this mode | ||||
FUJIWARA Katsunori
|
r17726 | mode = vfs.stat().st_mode | ||
Augie Fackler
|
r43346 | # avoid some useless chmods | ||
Gregory Szorc
|
r25658 | if (0o777 & ~util.umask) == (0o777 & mode): | ||
Matt Mackall
|
r6898 | mode = None | ||
except OSError: | ||||
mode = None | ||||
return mode | ||||
Augie Fackler
|
r43346 | |||
Pulkit Goyal
|
# names returned by basicstore.copylist(); encodedstore.copylist() returns
# the same names prefixed with 'store/'
_data = [
    b'bookmarks',
    b'narrowspec',
    b'data',
    b'meta',
    b'00manifest.d',
    b'00manifest.i',
    b'00changelog.d',
    b'00changelog.i',
    b'phaseroots',
    b'obsstore',
    b'requires',
]
Augie Fackler
|
r43346 | |||
# file name suffixes that isrevlog() accepts
REVLOG_FILES_EXT = (b'.i', b'.d', b'.n', b'.nd')


def isrevlog(f, kind, st):
    """Tell whether directory entry ``f`` is a regular file with one of the
    REVLOG_FILES_EXT suffixes.

    ``kind`` is the entry's file type (compared against ``stat.S_IFREG``);
    ``st`` is accepted for the file filter signature and is not used.
    """
    return kind == stat.S_IFREG and f.endswith(REVLOG_FILES_EXT)
Gregory Szorc
|
r37427 | |||
Augie Fackler
|
r43346 | |||
Benoit Boissinot
|
class basicstore(object):
    '''base class for local repository stores'''

    def __init__(self, path, vfstype):
        rawvfs = vfstype(path)
        self.path = rawvfs.base
        self.createmode = _calcmode(rawvfs)
        rawvfs.createmode = self.createmode
        # rawvfs takes already-encoded names; vfs applies encodedir first
        self.rawvfs = rawvfs
        self.vfs = vfsmod.filtervfs(rawvfs, encodedir)
        self.opener = self.vfs

    def join(self, f):
        '''return the store path of f, dir-encoded, below self.path'''
        return b'/'.join((self.path, encodedir(f)))

    def _walk(self, relpath, recurse, filefilter=isrevlog):
        '''returns a sorted list of (unencoded, encoded, size)

        Lists the entries below relpath (relative to the store) accepted by
        filefilter, descending into sub-directories only if recurse is set.
        '''
        root = self.path
        if relpath:
            root += b'/' + relpath
        if not self.rawvfs.isdir(root):
            return []

        # entries are reported relative to the store root
        striplen = len(self.path) + 1
        readdir = self.rawvfs.readdir
        found = []
        pending = [root]
        while pending:
            current = pending.pop()
            for name, kind, st in readdir(current, stat=True):
                full = current + b'/' + name
                if filefilter(name, kind, st):
                    encoded = util.pconvert(full[striplen:])
                    found.append((decodedir(encoded), encoded, st.st_size))
                elif kind == stat.S_IFDIR and recurse:
                    pending.append(full)
        return sorted(found)

    def changelog(self, trypending):
        '''return a changelog object reading through this store's vfs'''
        return changelog.changelog(self.vfs, trypending=trypending)

    def manifestlog(self, repo, storenarrowmatch):
        '''return a manifestlog object reading through this store's vfs'''
        rootstore = manifest.manifestrevlog(self.vfs)
        return manifest.manifestlog(self.vfs, repo, rootstore, storenarrowmatch)

    def datafiles(self, matcher=None):
        '''return the entries found below data/ followed by those below meta/

        matcher is not used by this implementation.
        '''
        entries = self._walk(b'data', True)
        entries += self._walk(b'meta', True)
        return entries

    def topfiles(self):
        '''return the entries directly in the store, in reverse sorted order'''
        # yield manifest before changelog
        return reversed(self._walk(b'', False))

    def walk(self, matcher=None):
        """yields (unencoded, encoded, size)

        if a matcher is passed, it is handed to datafiles(), which decides
        which storage files are reported for the tracked paths
        """
        # yield data files first
        for entry in self.datafiles(matcher):
            yield entry
        for entry in self.topfiles():
            yield entry

    def copylist(self):
        '''return the module-level _data list'''
        return _data

    def write(self, tr):
        '''does nothing in this class'''
        pass

    def invalidatecaches(self):
        '''does nothing in this class'''
        pass

    def markremoved(self, fn):
        '''does nothing in this class'''
        pass

    def __contains__(self, path):
        '''Checks if the store contains path'''
        stored = b"data/" + path
        # file?
        if self.vfs.exists(stored + b".i"):
            return True
        # dir?
        if not stored.endswith(b"/"):
            stored += b"/"
        return self.vfs.exists(stored)
smuralid
|
r17744 | |||
Augie Fackler
|
r43346 | |||
Matt Mackall
|
class encodedstore(basicstore):
    '''store living in <path>/store whose names go through encodefilename'''

    def __init__(self, path, vfstype):
        rawvfs = vfstype(path + b'/store')
        self.path = rawvfs.base
        self.createmode = _calcmode(rawvfs)
        rawvfs.createmode = self.createmode
        # rawvfs takes already-encoded names; vfs applies encodefilename
        self.rawvfs = rawvfs
        self.vfs = vfsmod.filtervfs(rawvfs, encodefilename)
        self.opener = self.vfs

    def datafiles(self, matcher=None):
        '''yields (unencoded, encoded, size) for the data files

        unencoded is None when the on-disk name cannot be decoded; such
        entries are always reported. Decodable entries are reported only if
        _matchtrackedpath accepts them.
        '''
        for name, encoded, size in super(encodedstore, self).datafiles():
            try:
                decoded = decodefilename(name)
            except KeyError:
                decoded = None
            if decoded is None or _matchtrackedpath(decoded, matcher):
                yield decoded, encoded, size

    def join(self, f):
        '''return the store path of f, fully encoded, below self.path'''
        return b'/'.join((self.path, encodefilename(f)))

    def copylist(self):
        '''return two top-level names followed by _data prefixed by store/'''
        toplevel = [b'requires', b'00changelog.i']
        instore = [b'store/' + f for f in _data]
        return toplevel + instore
Augie Fackler
|
r43346 | |||
Matt Mackall
|
r6903 | |||
Benoit Boissinot
|
class fncache(object):
    """in-memory view of the store's 'fncache' file

    ``entries`` is the set of names read from the file (None while the file
    has not been read yet), ``addls`` the set of names added since then and
    ``_dirty`` tells that ``entries`` lost a name, so the file has to be
    rewritten instead of appended to.
    """

    # the filename used to be partially encoded
    # hence the encodedir/decodedir dance
    def __init__(self, vfs):
        self.vfs = vfs
        self.entries = None
        self._dirty = False
        # set of new additions to fncache
        self.addls = set()

    def ensureloaded(self, warn=None):
        """read the fncache file if not already read.

        If the file on disk is corrupted, raise. If warn is provided,
        warn and keep going instead."""
        if self.entries is None:
            self._load(warn)

    def _load(self, warn=None):
        '''fill the entries from the fncache file

        A file that cannot be opened (IOError) gives an empty set. If the
        content does not end with a newline or contains an empty line, warn
        is called with a message when provided, otherwise error.Abort is
        raised. The file is closed in every case.
        '''
        self._dirty = False
        try:
            fp = self.vfs(b'fncache', mode=b'rb')
        except IOError:
            # skip nonexistent file
            self.entries = set()
            return

        # close the file on every exit path, including the Abort raised
        # below or from _checkentries
        try:
            self.entries = set()
            chunk = b''
            for c in iter(functools.partial(fp.read, fncache_chunksize), b''):
                chunk += c
                p = chunk.rfind(b'\n')
                if p == -1:
                    # no newline yet, maybe the entry is bigger than the
                    # chunksize, so let's keep iterating
                    continue
                # consume all complete lines, keep the unfinished tail
                self.entries.update(decodedir(chunk[: p + 1]).splitlines())
                chunk = chunk[p + 1 :]

            if chunk:
                msg = _(b"fncache does not ends with a newline")
                if warn:
                    warn(msg + b'\n')
                else:
                    raise error.Abort(
                        msg,
                        hint=_(
                            b"use 'hg debugrebuildfncache' to "
                            b"rebuild the fncache"
                        ),
                    )
            self._checkentries(fp, warn)
        finally:
            fp.close()

    def _checkentries(self, fp, warn):
        """ make sure there is no empty string in entries

        When there is one, fp is re-read from the start to report the line
        number of each empty line: through warn when provided, otherwise by
        raising error.Abort on the first one.
        """
        if b'' in self.entries:
            fp.seek(0)
            for n, line in enumerate(util.iterfile(fp)):
                if not line.rstrip(b'\n'):
                    t = _(b'invalid entry in fncache, line %d') % (n + 1)
                    if warn:
                        warn(t + b'\n')
                    else:
                        raise error.Abort(t)

    def write(self, tr):
        '''write pending changes to the fncache file

        If an entry was removed (_dirty), the whole file is rewritten from
        entries plus the pending additions. Otherwise pending additions are
        appended and entries is reset to None so that the next access
        reloads the file. tr.addbackup is called before either write.
        '''
        if self._dirty:
            assert self.entries is not None
            self.entries = self.entries | self.addls
            self.addls = set()
            tr.addbackup(b'fncache')
            fp = self.vfs(b'fncache', mode=b'wb', atomictemp=True)
            if self.entries:
                fp.write(encodedir(b'\n'.join(self.entries) + b'\n'))
            fp.close()
            self._dirty = False
        if self.addls:
            # if we have just new entries, let's append them to the fncache
            tr.addbackup(b'fncache')
            fp = self.vfs(b'fncache', mode=b'ab', atomictemp=True)
            if self.addls:
                fp.write(encodedir(b'\n'.join(self.addls) + b'\n'))
            fp.close()
            self.entries = None
            self.addls = set()

    def add(self, fn):
        '''record fn as a pending addition unless it is a loaded entry'''
        if self.entries is None:
            self._load()
        if fn not in self.entries:
            self.addls.add(fn)

    def remove(self, fn):
        '''forget fn

        A pending addition is simply dropped. Removing a loaded entry marks
        the cache dirty. An unknown fn is ignored.
        '''
        if self.entries is None:
            self._load()
        if fn in self.addls:
            self.addls.remove(fn)
            return
        try:
            self.entries.remove(fn)
            self._dirty = True
        except KeyError:
            pass

    def __contains__(self, fn):
        # pending additions are checked first, without loading the file
        if fn in self.addls:
            return True
        if self.entries is None:
            self._load()
        return fn in self.entries

    def __iter__(self):
        '''iterate over the loaded entries and the pending additions'''
        if self.entries is None:
            self._load()
        return iter(self.entries | self.addls)
Adrian Buehlmann
|
r7229 | |||
Augie Fackler
|
r43346 | |||
Boris Feld
|
class _fncachevfs(vfsmod.proxyvfs):
    '''vfs proxy that encodes names and registers written files in a fncache'''

    def __init__(self, vfs, fnc, encode):
        vfsmod.proxyvfs.__init__(self, vfs)
        self.fncache = fnc
        self.encode = encode

    def __call__(self, path, mode=b'r', *args, **kw):
        '''open the encoded path through the wrapped vfs

        A path below data/ or meta/ opened in any mode other than b'r' or
        b'rb' is added to the fncache, unless the fncache is not loaded yet
        and the file is already known to exist.
        '''
        encoded = self.encode(path)
        writing = mode not in (b'r', b'rb')
        if writing and path.startswith((b'data/', b'meta/')):
            # do not trigger a fncache load when adding a file that already is
            # known to exist.
            known = self.fncache.entries is None and self.vfs.exists(encoded)
            if known and b'a' in mode and not self.vfs.stat(encoded).st_size:
                # when appending to an existing file, if the file has size zero,
                # it should be considered as missing. Such zero-size files are
                # the result of truncation when a transaction is aborted.
                known = False
            if not known:
                self.fncache.add(path)
        return self.vfs(encoded, mode, *args, **kw)

    def join(self, path):
        '''join through the wrapped vfs, encoding path unless it is empty'''
        target = self.encode(path) if path else path
        return self.vfs.join(target)
Augie Fackler
|
r43346 | |||
Adrian Buehlmann
|
class fncachestore(basicstore):
    '''store living in <path>/store that lists its data files in a fncache'''

    def __init__(self, path, vfstype, dotencode):
        # dotencode selects which path encoder the store uses
        self.encode = encode = _pathencode if dotencode else _plainhybridencode
        rawvfs = vfstype(path + b'/store')
        self.path = rawvfs.base
        self.pathsep = self.path + b'/'
        self.createmode = _calcmode(rawvfs)
        rawvfs.createmode = self.createmode
        self.rawvfs = rawvfs
        self.fncache = fnc = fncache(rawvfs)
        self.vfs = _fncachevfs(rawvfs, fnc, encode)
        self.opener = self.vfs

    def join(self, f):
        '''return the encoded store path of f below self.path'''
        return self.pathsep + self.encode(f)

    def getsize(self, path):
        '''return the size of the already-encoded path, from rawvfs.stat'''
        return self.rawvfs.stat(path).st_size

    def datafiles(self, matcher=None):
        '''yields (unencoded, encoded, size) for the sorted fncache entries

        Entries rejected by _matchtrackedpath and entries whose file does
        not exist (ENOENT) are skipped; any other OSError is propagated.
        '''
        for name in sorted(self.fncache):
            if _matchtrackedpath(name, matcher):
                encoded = self.encode(name)
                try:
                    yield name, encoded, self.getsize(encoded)
                except OSError as err:
                    if err.errno != errno.ENOENT:
                        raise

    def copylist(self):
        '''return two top-level names followed by store/-prefixed names'''
        instore = (
            b'bookmarks',
            b'narrowspec',
            b'data',
            b'meta',
            b'dh',
            b'fncache',
            b'phaseroots',
            b'obsstore',
            b'00manifest.d',
            b'00manifest.i',
            b'00changelog.d',
            b'00changelog.i',
            b'requires',
        )
        toplevel = [b'requires', b'00changelog.i']
        return toplevel + [b'store/' + f for f in instore]

    def write(self, tr):
        '''write the fncache'''
        self.fncache.write(tr)

    def invalidatecaches(self):
        '''drop the loaded fncache entries and the pending additions'''
        fnc = self.fncache
        fnc.entries = None
        fnc.addls = set()

    def markremoved(self, fn):
        '''remove fn from the fncache'''
        self.fncache.remove(fn)

    def _exists(self, f):
        '''tell whether the encoded form of f can be stat'ed

        ENOENT means False; any other OSError is propagated.
        '''
        encoded = self.encode(f)
        try:
            self.getsize(encoded)
        except OSError as err:
            if err.errno != errno.ENOENT:
                raise
            # nonexistent entry
            return False
        else:
            return True

    def __contains__(self, path):
        '''Checks if the store contains path'''
        stored = b"data/" + path
        # check for files (exact match)
        revlog = stored + b'.i'
        if revlog in self.fncache and self._exists(revlog):
            return True
        # now check for directories (prefix match)
        if not stored.endswith(b'/'):
            stored += b'/'
        return any(
            e.startswith(stored) and self._exists(e) for e in self.fncache
        )