##// END OF EJS Templates
tracing: add support for emitting counters...
tracing: add support for emitting counters Differential Revision: https://phab.mercurial-scm.org/D6526

File last commit:

r42528:27d6956d default
r42677:e658ac39 default
Show More
store.py
654 lines | 20.3 KiB | text/x-python | PythonLexer
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839 # store.py - repository store handling for Mercurial
#
# Copyright 2008 Matt Mackall <mpm@selenic.com>
#
Martin Geisler
updated license to be explicit about GPL version 2
r8225 # This software may be used and distributed according to the terms of the
Matt Mackall
Update license to GPLv2+
r10263 # GNU General Public License version 2 or any later version.
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839
Gregory Szorc
store: use absolute_import
r27480 from __future__ import absolute_import
import errno
Pulkit Goyal
store: don't read the whole fncache in memory...
r42144 import functools
Augie Fackler
store: use hashlib.sha1 directly instead of through util...
r29338 import hashlib
Gregory Szorc
store: use absolute_import
r27480 import os
import stat
from .i18n import _
from . import (
error,
Pulkit Goyal
py3: use node.hex(h.digest()) instead of h.hexdigest()...
r35600 node,
Yuya Nishihara
parsers: switch to policy importer...
r32372 policy,
Mateusz Kwapich
py3: make encodefun in store.py compatible with py3k...
r30077 pycompat,
Gregory Szorc
store: use absolute_import
r27480 util,
Pierre-Yves David
vfs: use 'vfs' module directly in 'mercurial.store'...
r31234 vfs as vfsmod,
Gregory Szorc
store: use absolute_import
r27480 )
Adrian Buehlmann
introduce store classes...
r6840
Yuya Nishihara
parsers: switch to policy importer...
r32372 parsers = policy.importmod(r'parsers')
Pulkit Goyal
store: don't read the whole fncache in memory...
r42144 # how much bytes should be read from fncache in one read
# It is done to prevent loading large fncache files into memory
fncache_chunksize = 10 ** 6
Yuya Nishihara
parsers: switch to policy importer...
r32372
Pulkit Goyal
store: introduce _matchtrackedpath() and use it to filter store files...
r40529 def _matchtrackedpath(path, matcher):
"""parses a fncache entry and returns whether the entry is tracking a path
matched by matcher or not.
If matcher is None, returns True"""
if matcher is None:
return True
path = decodedir(path)
if path.startswith('data/'):
return matcher(path[len('data/'):-len('.i')])
elif path.startswith('meta/'):
Martin von Zweigbergk
match: use '' instead of '.' for root directory (API)...
r42528 return matcher.visitdir(path[len('meta/'):-len('/00manifest.i')])
Pulkit Goyal
store: introduce _matchtrackedpath() and use it to filter store files...
r40529
Pulkit Goyal
store: raise ProgrammingError if unable to decode a storage path...
r40658 raise error.ProgrammingError("cannot decode path %s" % path)
Benoit Boissinot
filelog encoding: move the encoding/decoding into store...
r8531 # This avoids a collision between a file named foo and a dir named
# foo.i or foo.d
Adrian Buehlmann
store: use fast C implementation of encodedir() if it's available...
r17607 def _encodedir(path):
Adrian Buehlmann
store: add some doctests
r13949 '''
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> _encodedir(b'data/foo.i')
Adrian Buehlmann
store: add some doctests
r13949 'data/foo.i'
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> _encodedir(b'data/foo.i/bla.i')
Adrian Buehlmann
store: add some doctests
r13949 'data/foo.i.hg/bla.i'
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> _encodedir(b'data/foo.i.hg/bla.i')
Adrian Buehlmann
store: add some doctests
r13949 'data/foo.i.hg.hg/bla.i'
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> _encodedir(b'data/foo.i\\ndata/foo.i/bla.i\\ndata/foo.i.hg/bla.i\\n')
Adrian Buehlmann
store: add multiline doctest case for encodedir()...
r17605 'data/foo.i\\ndata/foo.i.hg/bla.i\\ndata/foo.i.hg.hg/bla.i\\n'
Adrian Buehlmann
store: add some doctests
r13949 '''
Benoit Boissinot
filelog encoding: move the encoding/decoding into store...
r8531 return (path
.replace(".hg/", ".hg.hg/")
.replace(".i/", ".i.hg/")
.replace(".d/", ".d.hg/"))
Adrian Buehlmann
store: use fast C implementation of encodedir() if it's available...
r17607 encodedir = getattr(parsers, 'encodedir', _encodedir)
Benoit Boissinot
filelog encoding: move the encoding/decoding into store...
r8531 def decodedir(path):
Adrian Buehlmann
store: add some doctests
r13949 '''
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> decodedir(b'data/foo.i')
Adrian Buehlmann
store: add some doctests
r13949 'data/foo.i'
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> decodedir(b'data/foo.i.hg/bla.i')
Adrian Buehlmann
store: add some doctests
r13949 'data/foo.i/bla.i'
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> decodedir(b'data/foo.i.hg.hg/bla.i')
Adrian Buehlmann
store: add some doctests
r13949 'data/foo.i.hg/bla.i'
'''
Adrian Buehlmann
store: remove uneeded startswith('data/') checks in encodedir() and decodedir()...
r17586 if ".hg/" not in path:
Benoit Boissinot
filelog encoding: move the encoding/decoding into store...
r8531 return path
return (path
.replace(".d.hg/", ".d/")
.replace(".i.hg/", ".i/")
.replace(".hg.hg/", ".hg/"))
timeless
store: treat range as a generator instead of a list for py3 compat
r29071 def _reserved():
''' characters that are problematic for filesystems
* ascii escapes (0..31)
* ascii hi (126..255)
* windows specials
these characters will be escaped by encodefunctions
'''
Mateusz Kwapich
py3: make the string unicode so its iterable in py3k
r30076 winreserved = [ord(x) for x in u'\\:*?"<>|']
timeless
store: treat range as a generator instead of a list for py3 compat
r29071 for x in range(32):
yield x
for x in range(126, 256):
yield x
for x in winreserved:
yield x
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839 def _buildencodefun():
Adrian Buehlmann
store: add some doctests
r13949 '''
>>> enc, dec = _buildencodefun()
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> enc(b'nothing/special.txt')
Adrian Buehlmann
store: add some doctests
r13949 'nothing/special.txt'
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> dec(b'nothing/special.txt')
Adrian Buehlmann
store: add some doctests
r13949 'nothing/special.txt'
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> enc(b'HELLO')
Adrian Buehlmann
store: add some doctests
r13949 '_h_e_l_l_o'
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> dec(b'_h_e_l_l_o')
Adrian Buehlmann
store: add some doctests
r13949 'HELLO'
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> enc(b'hello:world?')
Adrian Buehlmann
store: add some doctests
r13949 'hello~3aworld~3f'
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> dec(b'hello~3aworld~3f')
Adrian Buehlmann
store: add some doctests
r13949 'hello:world?'
Yuya Nishihara
doctest: do not embed non-ascii characters in docstring...
r34138 >>> enc(b'the\\x07quick\\xADshot')
Adrian Buehlmann
store: add some doctests
r13949 'the~07quick~adshot'
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> dec(b'the~07quick~adshot')
Adrian Buehlmann
store: add some doctests
r13949 'the\\x07quick\\xadshot'
'''
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839 e = '_'
Yuya Nishihara
py3: factor out bytechr() function...
r31253 xchr = pycompat.bytechr
asciistr = list(map(xchr, range(127)))
Mateusz Kwapich
py3: make encodefun in store.py compatible with py3k...
r30077 capitals = list(range(ord("A"), ord("Z") + 1))
Martijn Pieters
store: py26 compat, don't use a dict comprehension
r30108 cmap = dict((x, x) for x in asciistr)
timeless
store: treat range as a generator instead of a list for py3 compat
r29071 for x in _reserved():
Mateusz Kwapich
py3: make encodefun in store.py compatible with py3k...
r30077 cmap[xchr(x)] = "~%02x" % x
for x in capitals + [ord(e)]:
cmap[xchr(x)] = e + xchr(x).lower()
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839 dmap = {}
for k, v in cmap.iteritems():
dmap[v] = k
def decode(s):
i = 0
while i < len(s):
Gregory Szorc
global: use pycompat.xrange()...
r38806 for l in pycompat.xrange(1, 4):
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839 try:
Matt Mackall
many, many trivial check-code fixups
r10282 yield dmap[s[i:i + l]]
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839 i += l
break
except KeyError:
pass
else:
raise KeyError
Gregory Szorc
global: use pycompat.xrange()...
r38806 return (lambda s: ''.join([cmap[s[c:c + 1]]
for c in pycompat.xrange(len(s))]),
Adrian Buehlmann
store: extract functions _encodefname and _decodefname
r17608 lambda s: ''.join(list(decode(s))))
_encodefname, _decodefname = _buildencodefun()
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839
Adrian Buehlmann
store: extract functions _encodefname and _decodefname
r17608 def encodefilename(s):
'''
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> encodefilename(b'foo.i/bar.d/bla.hg/hi:world?/HELLO')
Adrian Buehlmann
store: extract functions _encodefname and _decodefname
r17608 'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o'
'''
return _encodefname(encodedir(s))
def decodefilename(s):
'''
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> decodefilename(b'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o')
Adrian Buehlmann
store: extract functions _encodefname and _decodefname
r17608 'foo.i/bar.d/bla.hg/hi:world?/HELLO'
'''
return decodedir(_decodefname(s))
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839
Adrian Buehlmann
store: change names to comply with project coding standards...
r14288 def _buildlowerencodefun():
Adrian Buehlmann
store: add some doctests
r13949 '''
Adrian Buehlmann
store: change names to comply with project coding standards...
r14288 >>> f = _buildlowerencodefun()
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> f(b'nothing/special.txt')
Adrian Buehlmann
store: add some doctests
r13949 'nothing/special.txt'
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> f(b'HELLO')
Adrian Buehlmann
store: add some doctests
r13949 'hello'
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> f(b'hello:world?')
Adrian Buehlmann
store: add some doctests
r13949 'hello~3aworld~3f'
Yuya Nishihara
doctest: do not embed non-ascii characters in docstring...
r34138 >>> f(b'the\\x07quick\\xADshot')
Adrian Buehlmann
store: add some doctests
r13949 'the~07quick~adshot'
'''
Yuya Nishihara
py3: use bytechr() in store._buildlowerencodefun()
r34211 xchr = pycompat.bytechr
Gregory Szorc
global: use pycompat.xrange()...
r38806 cmap = dict([(xchr(x), xchr(x)) for x in pycompat.xrange(127)])
timeless
store: treat range as a generator instead of a list for py3 compat
r29071 for x in _reserved():
Yuya Nishihara
py3: use bytechr() in store._buildlowerencodefun()
r34211 cmap[xchr(x)] = "~%02x" % x
Mads Kiilerich
check-code: there must also be whitespace between ')' and operator...
r18054 for x in range(ord("A"), ord("Z") + 1):
Yuya Nishihara
py3: use bytechr() in store._buildlowerencodefun()
r34211 cmap[xchr(x)] = xchr(x).lower()
Yuya Nishihara
store: give name to lowerencode function...
r34210 def lowerencode(s):
Yuya Nishihara
py3: iterate bytes as a byte string in store.lowerencode()
r34212 return "".join([cmap[c] for c in pycompat.iterbytestr(s)])
Yuya Nishihara
store: give name to lowerencode function...
r34210 return lowerencode
Adrian Buehlmann
introduce fncache repository layout...
r7229
Bryan O'Sullivan
store: implement lowerencode in C
r18430 lowerencode = getattr(parsers, 'lowerencode', None) or _buildlowerencodefun()
Adrian Buehlmann
introduce fncache repository layout...
r7229
Adrian Buehlmann
store: optimze _auxencode() a bit by grouping the reserved names by length...
r17570 # Windows reserved names: con, prn, aux, nul, com1..com9, lpt1..lpt9
_winres3 = ('aux', 'con', 'prn', 'nul') # length 3
_winres4 = ('com', 'lpt') # length 4 (with trailing 1..9)
Adrian Buehlmann
store: encode first period or space in filenames (issue1713)...
r12687 def _auxencode(path, dotencode):
Adrian Buehlmann
store: add some doctests
r13949 '''
Encodes filenames containing names reserved by Windows or which end in
period or space. Does not touch other single reserved characters c.
Specifically, c in '\\:*?"<>|' or ord(c) <= 31 are *not* encoded here.
Additionally encodes space or period at the beginning, if dotencode is
Adrian Buehlmann
store: explain "aux.foo" versus "foo.aux" in doc of _auxencode()
r17569 True. Parameter path is assumed to be all lowercase.
A segment only needs encoding if a reserved name appears as a
basename (e.g. "aux", "aux.foo"). A directory or file named "foo.aux"
doesn't need encoding.
Adrian Buehlmann
store: add some doctests
r13949
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> s = b'.foo/aux.txt/txt.aux/con/prn/nul/foo.'
>>> _auxencode(s.split(b'/'), True)
Adrian Buehlmann
store: let _auxencode() return the list of path segments...
r17574 ['~2efoo', 'au~78.txt', 'txt.aux', 'co~6e', 'pr~6e', 'nu~6c', 'foo~2e']
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> s = b'.com1com2/lpt9.lpt4.lpt1/conprn/com0/lpt0/foo.'
>>> _auxencode(s.split(b'/'), False)
Adrian Buehlmann
store: let _auxencode() return the list of path segments...
r17574 ['.com1com2', 'lp~749.lpt4.lpt1', 'conprn', 'com0', 'lpt0', 'foo~2e']
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> _auxencode([b'foo. '], True)
Adrian Buehlmann
store: let _auxencode() return the list of path segments...
r17574 ['foo.~20']
Yuya Nishihara
doctest: bulk-replace string literals with b'' for Python 3...
r34133 >>> _auxencode([b' .foo'], True)
Adrian Buehlmann
store: let _auxencode() return the list of path segments...
r17574 ['~20.foo']
Adrian Buehlmann
store: add some doctests
r13949 '''
Adrian Buehlmann
store: parameter path of _auxencode is now a list of strings
r17589 for i, n in enumerate(path):
Adrian Buehlmann
store: unindent most of the contents of the for loop in _auxencode()...
r17572 if not n:
continue
if dotencode and n[0] in '. ':
Augie Fackler
store: fix many single-byte ops to use slicing in _auxencode
r31362 n = "~%02x" % ord(n[0:1]) + n[1:]
Adrian Buehlmann
store: parameter path of _auxencode is now a list of strings
r17589 path[i] = n
Adrian Buehlmann
store: unindent most of the contents of the for loop in _auxencode()...
r17572 else:
l = n.find('.')
if l == -1:
l = len(n)
if ((l == 3 and n[:3] in _winres3) or
Augie Fackler
store: fix many single-byte ops to use slicing in _auxencode
r31362 (l == 4 and n[3:4] <= '9' and n[3:4] >= '1'
Adrian Buehlmann
store: unindent most of the contents of the for loop in _auxencode()...
r17572 and n[:3] in _winres4)):
# encode third letter ('aux' -> 'au~78')
Augie Fackler
store: fix many single-byte ops to use slicing in _auxencode
r31362 ec = "~%02x" % ord(n[2:3])
Adrian Buehlmann
store: unindent most of the contents of the for loop in _auxencode()...
r17572 n = n[0:2] + ec + n[3:]
Adrian Buehlmann
store: parameter path of _auxencode is now a list of strings
r17589 path[i] = n
Adrian Buehlmann
store: unindent most of the contents of the for loop in _auxencode()...
r17572 if n[-1] in '. ':
# encode last period or space ('foo...' -> 'foo..~2e')
Augie Fackler
store: fix many single-byte ops to use slicing in _auxencode
r31362 path[i] = n[:-1] + "~%02x" % ord(n[-1:])
Adrian Buehlmann
store: parameter path of _auxencode is now a list of strings
r17589 return path
Adrian Buehlmann
introduce fncache repository layout...
r7229
Adrian Buehlmann
store: change names to comply with project coding standards...
r14288 _maxstorepathlen = 120
_dirprefixlen = 8
_maxshortdirslen = 8 * (_dirprefixlen + 1) - 4
Bryan O'Sullivan
store: refactor hashed encoding into its own function
r17610
def _hashencode(path, dotencode):
Pulkit Goyal
py3: use node.hex(h.digest()) instead of h.hexdigest()...
r35600 digest = node.hex(hashlib.sha1(path).digest())
Martin von Zweigbergk
treemanifest: store submanifest revlog per directory...
r25091 le = lowerencode(path[5:]).split('/') # skips prefix 'data/' or 'meta/'
Bryan O'Sullivan
store: refactor hashed encoding into its own function
r17610 parts = _auxencode(le, dotencode)
basename = parts[-1]
_root, ext = os.path.splitext(basename)
sdirs = []
sdirslen = 0
for p in parts[:-1]:
d = p[:_dirprefixlen]
if d[-1] in '. ':
# Windows can't access dirs ending in period or space
d = d[:-1] + '_'
if sdirslen == 0:
t = len(d)
else:
t = sdirslen + 1 + len(d)
if t > _maxshortdirslen:
break
sdirs.append(d)
sdirslen = t
dirs = '/'.join(sdirs)
if len(dirs) > 0:
dirs += '/'
res = 'dh/' + dirs + digest + ext
spaceleft = _maxstorepathlen - len(res)
if spaceleft > 0:
filler = basename[:spaceleft]
res = 'dh/' + dirs + filler + digest + ext
return res
Adrian Buehlmann
store: eliminate one level of lambda functions on _hybridencode
r17590 def _hybridencode(path, dotencode):
Adrian Buehlmann
introduce fncache repository layout...
r7229 '''encodes path with a length limit
Encodes all paths that begin with 'data/', according to the following.
Default encoding (reversible):
Encodes all uppercase letters 'X' as '_x'. All reserved or illegal
characters are encoded as '~xx', where xx is the two digit hex code
of the character (see encodefilename).
Relevant path components consisting of Windows reserved filenames are
Mads Kiilerich
spelling: fix minor spell checker issues
r17738 masked by encoding the third character ('aux' -> 'au~78', see _auxencode).
Adrian Buehlmann
introduce fncache repository layout...
r7229
Hashed encoding (not reversible):
Adrian Buehlmann
store: change names to comply with project coding standards...
r14288 If the default-encoded path is longer than _maxstorepathlen, a
Adrian Buehlmann
introduce fncache repository layout...
r7229 non-reversible hybrid hashing of the path is done instead.
Adrian Buehlmann
store: change names to comply with project coding standards...
r14288 This encoding uses up to _dirprefixlen characters of all directory
Adrian Buehlmann
introduce fncache repository layout...
r7229 levels of the lowerencoded path, but not more levels than can fit into
Adrian Buehlmann
store: change names to comply with project coding standards...
r14288 _maxshortdirslen.
Adrian Buehlmann
introduce fncache repository layout...
r7229 Then follows the filler followed by the sha digest of the full path.
The filler is the beginning of the basename of the lowerencoded path
(the basename is everything after the last path separator). The filler
is as long as possible, filling in characters from the basename until
Adrian Buehlmann
store: change names to comply with project coding standards...
r14288 the encoded path has _maxstorepathlen characters (or all chars of the
basename have been taken).
Adrian Buehlmann
introduce fncache repository layout...
r7229 The extension (e.g. '.i' or '.d') is preserved.
The string 'data/' at the beginning is replaced with 'dh/', if the hashed
encoding was used.
'''
Adrian Buehlmann
store: reuse direncoded path in _hybridencode...
r17609 path = encodedir(path)
ef = _encodefname(path).split('/')
Adrian Buehlmann
store: eliminate one level of lambda functions on _hybridencode
r17590 res = '/'.join(_auxencode(ef, dotencode))
Adrian Buehlmann
store: change names to comply with project coding standards...
r14288 if len(res) > _maxstorepathlen:
Bryan O'Sullivan
store: refactor hashed encoding into its own function
r17610 res = _hashencode(path, dotencode)
Adrian Buehlmann
introduce fncache repository layout...
r7229 return res
Adrian Buehlmann
store: add a fallback _pathencode Python function...
r17624 def _pathencode(path):
Bryan O'Sullivan
store: switch to C-based hashed path encoding
r18435 de = encodedir(path)
Adrian Buehlmann
store: optimize _pathencode by checking the length of the unencoded path...
r17693 if len(path) > _maxstorepathlen:
Bryan O'Sullivan
store: switch to C-based hashed path encoding
r18435 return _hashencode(de, True)
ef = _encodefname(de).split('/')
Adrian Buehlmann
store: add a fallback _pathencode Python function...
r17624 res = '/'.join(_auxencode(ef, True))
if len(res) > _maxstorepathlen:
Bryan O'Sullivan
store: switch to C-based hashed path encoding
r18435 return _hashencode(de, True)
Adrian Buehlmann
store: add a fallback _pathencode Python function...
r17624 return res
_pathencode = getattr(parsers, 'pathencode', _pathencode)
Adrian Buehlmann
store: move _plainhybridencode and _dothybridencode higher up in the file...
r17623 def _plainhybridencode(f):
return _hybridencode(f, False)
FUJIWARA Katsunori
store: invoke "os.stat()" for "createmode" initialization via vfs...
r17726 def _calcmode(vfs):
Matt Mackall
store: simplify class hierarchy
r6898 try:
# files in .hg/ will be created using this mode
FUJIWARA Katsunori
store: invoke "os.stat()" for "createmode" initialization via vfs...
r17726 mode = vfs.stat().st_mode
Matt Mackall
store: simplify class hierarchy
r6898 # avoid some useless chmods
Gregory Szorc
global: mass rewrite to use modern octal syntax...
r25658 if (0o777 & ~util.umask) == (0o777 & mode):
Matt Mackall
store: simplify class hierarchy
r6898 mode = None
except OSError:
mode = None
return mode
Martin von Zweigbergk
bookmarks: keep bookmarks in .hg/store if new config set...
r42512 _data = ('bookmarks narrowspec data meta 00manifest.d 00manifest.i'
Martin von Zweigbergk
narrow: move .hg/narrowspec to .hg/store/narrowspec (BC)...
r38908 ' 00changelog.d 00changelog.i phaseroots obsstore')
Matt Mackall
clone: get a list of files to clone from store
r6903
Gregory Szorc
store: make file filtering during walk configurable...
r37427 def isrevlog(f, kind, st):
return kind == stat.S_IFREG and f[-2:] in ('.i', '.d')
Benoit Boissinot
use new style classes
r8778 class basicstore(object):
Adrian Buehlmann
introduce store classes...
r6840 '''base class for local repository stores'''
FUJIWARA Katsunori
store: rename "openertype" argument to "vfstype"
r17651 def __init__(self, path, vfstype):
FUJIWARA Katsunori
store: initialize vfs field first to use it for initialization of others...
r17724 vfs = vfstype(path)
self.path = vfs.base
FUJIWARA Katsunori
store: invoke "os.stat()" for "createmode" initialization via vfs...
r17726 self.createmode = _calcmode(vfs)
FUJIWARA Katsunori
store: rename "op" variables to "vfs"
r17652 vfs.createmode = self.createmode
FUJIWARA Katsunori
store: invoke "os.path.isdir()" via vfs...
r17728 self.rawvfs = vfs
Pierre-Yves David
vfs: use 'vfs' module directly in 'mercurial.store'...
r31234 self.vfs = vfsmod.filtervfs(vfs, encodedir)
FUJIWARA Katsunori
store: initialize "vfs" fields by "vfs" constructors...
r17653 self.opener = self.vfs
Adrian Buehlmann
introduce store classes...
r6840
def join(self, f):
Adrian Buehlmann
store: remove pointless pathjoiner parameter...
r13426 return self.path + '/' + encodedir(f)
Adrian Buehlmann
introduce store classes...
r6840
Gregory Szorc
store: make file filtering during walk configurable...
r37427 def _walk(self, relpath, recurse, filefilter=isrevlog):
Matt Mackall
store: change handling of decoding errors
r6900 '''yields (unencoded, encoded, size)'''
Adrian Buehlmann
store: remove pointless pathjoiner parameter...
r13426 path = self.path
if relpath:
path += '/' + relpath
striplen = len(self.path) + 1
Matt Mackall
store: simplify walking...
r6899 l = []
FUJIWARA Katsunori
store: invoke "os.path.isdir()" via vfs...
r17728 if self.rawvfs.isdir(path):
Matt Mackall
store: simplify walking...
r6899 visit = [path]
FUJIWARA Katsunori
store: invoke "osutil.listdir()" via vfs...
r17747 readdir = self.rawvfs.readdir
Matt Mackall
store: simplify walking...
r6899 while visit:
p = visit.pop()
FUJIWARA Katsunori
store: invoke "osutil.listdir()" via vfs...
r17747 for f, kind, st in readdir(p, stat=True):
Adrian Buehlmann
store: remove pointless pathjoiner parameter...
r13426 fp = p + '/' + f
Gregory Szorc
store: make file filtering during walk configurable...
r37427 if filefilter(f, kind, st):
Matt Mackall
store: change handling of decoding errors
r6900 n = util.pconvert(fp[striplen:])
Benoit Boissinot
filelog encoding: move the encoding/decoding into store...
r8531 l.append((decodedir(n), n, st.st_size))
Matt Mackall
store: simplify walking...
r6899 elif kind == stat.S_IFDIR and recurse:
visit.append(fp)
Bryan O'Sullivan
store: sort filenames in place
r17054 l.sort()
return l
Adrian Buehlmann
introduce store classes...
r6840
Pulkit Goyal
store: pass matcher to store.datafiles()...
r40376 def datafiles(self, matcher=None):
Martin von Zweigbergk
treemanifests: fix streaming clone...
r28007 return self._walk('data', True) + self._walk('meta', True)
Adrian Buehlmann
introduce store classes...
r6840
Durham Goode
store: move top file walk to a separate function...
r19177 def topfiles(self):
# yield manifest before changelog
return reversed(self._walk('', False))
Pulkit Goyal
store: pass matcher to store.datafiles()...
r40376 def walk(self, matcher=None):
'''yields (unencoded, encoded, size)
if a matcher is passed, storage files of only those tracked paths
are passed with matches the matcher
'''
Adrian Buehlmann
introduce store classes...
r6840 # yield data files first
Pulkit Goyal
store: pass matcher to store.datafiles()...
r40376 for x in self.datafiles(matcher):
Adrian Buehlmann
introduce store classes...
r6840 yield x
Durham Goode
store: move top file walk to a separate function...
r19177 for x in self.topfiles():
Adrian Buehlmann
introduce store classes...
r6840 yield x
Matt Mackall
clone: get a list of files to clone from store
r6903 def copylist(self):
return ['requires'] + _data.split()
Durham Goode
fncache: move fncache writing to be in a transaction...
r20883 def write(self, tr):
Adrian Buehlmann
fncachestore: defer updating the fncache file to a single file open...
r13391 pass
Durham Goode
caches: invalidate store caches when lock is taken...
r20884 def invalidatecaches(self):
pass
Durham Goode
fncache: clean up fncache during strips...
r20885 def markremoved(self, fn):
pass
smuralid
store: add a contains method to basicstore...
r17744 def __contains__(self, path):
'''Checks if the store contains path'''
path = "/".join(("data", path))
# file?
FUJIWARA Katsunori
store: use "vfs.exists()" instead of "os.path.exists()"
r19903 if self.vfs.exists(path + ".i"):
smuralid
store: add a contains method to basicstore...
r17744 return True
# dir?
if not path.endswith("/"):
path = path + "/"
FUJIWARA Katsunori
store: use "vfs.exists()" instead of "os.path.exists()"
r19903 return self.vfs.exists(path)
smuralid
store: add a contains method to basicstore...
r17744
Matt Mackall
store: simplify class hierarchy
r6898 class encodedstore(basicstore):
FUJIWARA Katsunori
store: rename "openertype" argument to "vfstype"
r17651 def __init__(self, path, vfstype):
FUJIWARA Katsunori
store: initialize vfs field first to use it for initialization of others...
r17724 vfs = vfstype(path + '/store')
self.path = vfs.base
FUJIWARA Katsunori
store: invoke "os.stat()" for "createmode" initialization via vfs...
r17726 self.createmode = _calcmode(vfs)
FUJIWARA Katsunori
store: rename "op" variables to "vfs"
r17652 vfs.createmode = self.createmode
FUJIWARA Katsunori
store: invoke "os.path.isdir()" via vfs...
r17728 self.rawvfs = vfs
Pierre-Yves David
vfs: use 'vfs' module directly in 'mercurial.store'...
r31234 self.vfs = vfsmod.filtervfs(vfs, encodefilename)
FUJIWARA Katsunori
store: initialize "vfs" fields by "vfs" constructors...
r17653 self.opener = self.vfs
Adrian Buehlmann
introduce store classes...
r6840
Pulkit Goyal
store: pass matcher to store.datafiles()...
r40376 def datafiles(self, matcher=None):
Martin von Zweigbergk
treemanifests: fix streaming clone...
r28007 for a, b, size in super(encodedstore, self).datafiles():
Adrian Buehlmann
verify: check repo.store
r6892 try:
Matt Mackall
store: change handling of decoding errors
r6900 a = decodefilename(a)
Adrian Buehlmann
verify: check repo.store
r6892 except KeyError:
Matt Mackall
store: change handling of decoding errors
r6900 a = None
Yuya Nishihara
store: pass in decoded filename to narrow matcher
r40620 if a is not None and not _matchtrackedpath(a, matcher):
continue
Matt Mackall
store: change handling of decoding errors
r6900 yield a, b, size
Adrian Buehlmann
introduce store classes...
r6840
def join(self, f):
Adrian Buehlmann
store: remove pointless pathjoiner parameter...
r13426 return self.path + '/' + encodefilename(f)
Adrian Buehlmann
introduce store classes...
r6840
Matt Mackall
clone: get a list of files to clone from store
r6903 def copylist(self):
return (['requires', '00changelog.i'] +
Adrian Buehlmann
store: remove pointless pathjoiner parameter...
r13426 ['store/' + f for f in _data.split()])
Matt Mackall
clone: get a list of files to clone from store
r6903
Benoit Boissinot
store: refactor the fncache handling...
r8530 class fncache(object):
Benoit Boissinot
filelog encoding: move the encoding/decoding into store...
r8531 # the filename used to be partially encoded
# hence the encodedir/decodedir dance
FUJIWARA Katsunori
store: rename field name from "opener" to "vfs" in internal classes for fncache...
r17722 def __init__(self, vfs):
self.vfs = vfs
Adrian Buehlmann
introduce fncache repository layout...
r7229 self.entries = None
Adrian Buehlmann
fncachestore: defer updating the fncache file to a single file open...
r13391 self._dirty = False
Pulkit Goyal
store: append to fncache if there are only new files to write...
r40767 # set of new additions to fncache
self.addls = set()
Adrian Buehlmann
introduce fncache repository layout...
r7229
Benoit Boissinot
store: refactor the fncache handling...
r8530 def _load(self):
'''fill the entries from the fncache file'''
Adrian Buehlmann
fncachestore: defer updating the fncache file to a single file open...
r13391 self._dirty = False
Benoit Boissinot
store: refactor the fncache handling...
r8530 try:
FUJIWARA Katsunori
store: rename field name from "opener" to "vfs" in internal classes for fncache...
r17722 fp = self.vfs('fncache', mode='rb')
Benoit Boissinot
store: refactor the fncache handling...
r8530 except IOError:
# skip nonexistent file
Bryan O'Sullivan
store: speed up read and write of large fncache files...
r16404 self.entries = set()
Benoit Boissinot
store: refactor the fncache handling...
r8530 return
Pulkit Goyal
store: don't read the whole fncache in memory...
r42144
self.entries = set()
chunk = b''
for c in iter(functools.partial(fp.read, fncache_chunksize), b''):
chunk += c
try:
p = chunk.rindex(b'\n')
self.entries.update(decodedir(chunk[:p + 1]).splitlines())
chunk = chunk[p + 1:]
except ValueError:
# substring '\n' not found, maybe the entry is bigger than the
# chunksize, so let's keep iterating
pass
Pulkit Goyal
store: error out if fncache does not ends with a newline...
r42147 if chunk:
Pulkit Goyal
store: recommend using `hg debugrebuildfncache` is fncache is corrupted...
r42156 raise error.Abort(_("fncache does not ends with a newline"),
hint=_("use 'hg debugrebuildfncache' to rebuild"
" the fncache"))
Pulkit Goyal
store: move logic to check for invalid entry in fncache to own function...
r42139 self._checkentries(fp)
fp.close()
def _checkentries(self, fp):
""" make sure there is no empty string in entries """
Bryan O'Sullivan
store: speed up read and write of large fncache files...
r16404 if '' in self.entries:
fp.seek(0)
Jun Wu
store: migrate to util.iterfile
r30398 for n, line in enumerate(util.iterfile(fp)):
Bryan O'Sullivan
store: speed up read and write of large fncache files...
r16404 if not line.rstrip('\n'):
timeless@mozdev.org
l10n: use %d instead of %s for numbers
r26778 t = _('invalid entry in fncache, line %d') % (n + 1)
Pierre-Yves David
error: get Abort from 'error' instead of 'util'...
r26587 raise error.Abort(t)
Adrian Buehlmann
introduce fncache repository layout...
r7229
Durham Goode
fncache: move fncache writing to be in a transaction...
r20883 def write(self, tr):
Bryan O'Sullivan
store: speed up read and write of large fncache files...
r16404 if self._dirty:
Boris Feld
store: assert the fncache have been loaded if dirty...
r38718 assert self.entries is not None
Pulkit Goyal
store: write fncache only once if there are both adds and removes...
r40779 self.entries = self.entries | self.addls
self.addls = set()
Durham Goode
fncache: move fncache writing to be in a transaction...
r20883 tr.addbackup('fncache')
Durham Goode
fncache: remove the rewriting logic...
r20879 fp = self.vfs('fncache', mode='wb', atomictemp=True)
if self.entries:
fp.write(encodedir('\n'.join(self.entries) + '\n'))
fp.close()
self._dirty = False
Pulkit Goyal
store: append to fncache if there are only new files to write...
r40767 if self.addls:
# if we have just new entries, let's append them to the fncache
tr.addbackup('fncache')
fp = self.vfs('fncache', mode='ab', atomictemp=True)
if self.addls:
fp.write(encodedir('\n'.join(self.addls) + '\n'))
fp.close()
self.entries = None
self.addls = set()
Benoit Boissinot
store: refactor the fncache handling...
r8530
def add(self, fn):
if self.entries is None:
self._load()
Adrian Buehlmann
store: only add new entries to the fncache file...
r10577 if fn not in self.entries:
Pulkit Goyal
store: append to fncache if there are only new files to write...
r40767 self.addls.add(fn)
Benoit Boissinot
store: refactor the fncache handling...
r8530
Durham Goode
fncache: clean up fncache during strips...
r20885 def remove(self, fn):
if self.entries is None:
self._load()
Pulkit Goyal
store: append to fncache if there are only new files to write...
r40767 if fn in self.addls:
self.addls.remove(fn)
return
Durham Goode
fncache: clean up fncache during strips...
r20885 try:
self.entries.remove(fn)
self._dirty = True
except KeyError:
pass
Adrian Buehlmann
store: move __contains__() implementation from class fncache into fncachestore...
r17782 def __contains__(self, fn):
Pulkit Goyal
store: append to fncache if there are only new files to write...
r40767 if fn in self.addls:
return True
Benoit Boissinot
store: refactor the fncache handling...
r8530 if self.entries is None:
self._load()
Adrian Buehlmann
store: move __contains__() implementation from class fncache into fncachestore...
r17782 return fn in self.entries
Benoit Boissinot
store: refactor the fncache handling...
r8530
def __iter__(self):
if self.entries is None:
self._load()
Pulkit Goyal
store: append to fncache if there are only new files to write...
r40767 return iter(self.entries | self.addls)
Adrian Buehlmann
introduce fncache repository layout...
r7229
Boris Feld
vfs: fix proxyvfs inheritance...
r41125 class _fncachevfs(vfsmod.proxyvfs):
FUJIWARA Katsunori
store: rename argument name from "op"(ener) to "vfs"
r17721 def __init__(self, vfs, fnc, encode):
Yuya Nishihara
vfs: rename auditvfs to proxyvfs...
r33412 vfsmod.proxyvfs.__init__(self, vfs)
Adrian Buehlmann
store: break up reference cycle introduced in 9cbff8a39a2a...
r14194 self.fncache = fnc
self.encode = encode
def __call__(self, path, mode='r', *args, **kw):
Martijn Pieters
fncache: avoid loading the filename cache when not actually modifying it...
r38683 encoded = self.encode(path)
Martin von Zweigbergk
treemanifests: fix streaming clone...
r28007 if mode not in ('r', 'rb') and (path.startswith('data/') or
path.startswith('meta/')):
Martijn Pieters
fncache: avoid loading the filename cache when not actually modifying it...
r38683 # do not trigger a fncache load when adding a file that already is
# known to exist.
notload = self.fncache.entries is None and self.vfs.exists(encoded)
if notload and 'a' in mode and not self.vfs.stat(encoded).st_size:
# when appending to an existing file, if the file has size zero,
# it should be considered as missing. Such zero-size files are
# the result of truncation when a transaction is aborted.
notload = False
if not notload:
self.fncache.add(path)
return self.vfs(encoded, mode, *args, **kw)
Adrian Buehlmann
store: break up reference cycle introduced in 9cbff8a39a2a...
r14194
FUJIWARA Katsunori
vfs: define "join()" in each classes derived from "abstractvfs"...
r17725 def join(self, path):
if path:
return self.vfs.join(self.encode(path))
else:
return self.vfs.join(path)
Adrian Buehlmann
introduce fncache repository layout...
r7229 class fncachestore(basicstore):
FUJIWARA Katsunori
store: rename "openertype" argument to "vfstype"
r17651 def __init__(self, path, vfstype, dotencode):
Adrian Buehlmann
store: move encode lambda logic into fncachestore...
r17591 if dotencode:
Bryan O'Sullivan
store: switch to C-based hashed path encoding
r18435 encode = _pathencode
Adrian Buehlmann
store: move encode lambda logic into fncachestore...
r17591 else:
encode = _plainhybridencode
Adrian Buehlmann
store: encode first period or space in filenames (issue1713)...
r12687 self.encode = encode
FUJIWARA Katsunori
store: initialize vfs field first to use it for initialization of others...
r17724 vfs = vfstype(path + '/store')
self.path = vfs.base
Bryan O'Sullivan
store: reduce string concatenation when joining...
r17562 self.pathsep = self.path + '/'
FUJIWARA Katsunori
store: invoke "os.stat()" for "createmode" initialization via vfs...
r17726 self.createmode = _calcmode(vfs)
FUJIWARA Katsunori
store: rename "op" variables to "vfs"
r17652 vfs.createmode = self.createmode
FUJIWARA Katsunori
store: replace invocation of "getsize()" by "vfs.stat()"...
r17727 self.rawvfs = vfs
FUJIWARA Katsunori
store: rename "op" variables to "vfs"
r17652 fnc = fncache(vfs)
Simon Heimberg
store: eliminate reference cycle in fncachestore...
r9133 self.fncache = fnc
FUJIWARA Katsunori
store: initialize "vfs" fields by "vfs" constructors...
r17653 self.vfs = _fncachevfs(vfs, fnc, encode)
self.opener = self.vfs
Adrian Buehlmann
introduce fncache repository layout...
r7229
def join(self, f):
Bryan O'Sullivan
store: reduce string concatenation when joining...
r17562 return self.pathsep + self.encode(f)
Adrian Buehlmann
introduce fncache repository layout...
r7229
Matt Mackall
store: restore getsize method...
r17731 def getsize(self, path):
return self.rawvfs.stat(path).st_size
Pulkit Goyal
store: pass matcher to store.datafiles()...
r40376 def datafiles(self, matcher=None):
Bryan O'Sullivan
store: sort the results of fncachestore.datafiles()
r17373 for f in sorted(self.fncache):
Pulkit Goyal
store: introduce _matchtrackedpath() and use it to filter store files...
r40529 if not _matchtrackedpath(f, matcher):
continue
Adrian Buehlmann
store: encode first period or space in filenames (issue1713)...
r12687 ef = self.encode(f)
Adrian Buehlmann
introduce fncache repository layout...
r7229 try:
Matt Mackall
store: restore getsize method...
r17731 yield f, ef, self.getsize(ef)
Gregory Szorc
global: mass rewrite to use modern exception syntax...
r25660 except OSError as err:
Bryan O'Sullivan
store: only one kind of OSError means "nonexistent entry"
r17374 if err.errno != errno.ENOENT:
raise
Adrian Buehlmann
introduce fncache repository layout...
r7229
def copylist(self):
Martin von Zweigbergk
bookmarks: keep bookmarks in .hg/store if new config set...
r42512 d = ('bookmarks narrowspec data meta dh fncache phaseroots obsstore'
Pierre-Yves David
phases: prevent rebase to rebase immutable changeset.
r15742 ' 00manifest.d 00manifest.i 00changelog.d 00changelog.i')
Adrian Buehlmann
introduce fncache repository layout...
r7229 return (['requires', '00changelog.i'] +
Adrian Buehlmann
store: remove pointless pathjoiner parameter...
r13426 ['store/' + f for f in d.split()])
Adrian Buehlmann
introduce fncache repository layout...
r7229
Durham Goode
fncache: move fncache writing to be in a transaction...
r20883 def write(self, tr):
self.fncache.write(tr)
Adrian Buehlmann
fncachestore: defer updating the fncache file to a single file open...
r13391
Durham Goode
caches: invalidate store caches when lock is taken...
r20884 def invalidatecaches(self):
self.fncache.entries = None
Pulkit Goyal
store: append to fncache if there are only new files to write...
r40767 self.fncache.addls = set()
Durham Goode
caches: invalidate store caches when lock is taken...
r20884
Durham Goode
fncache: clean up fncache during strips...
r20885 def markremoved(self, fn):
self.fncache.remove(fn)
Adrian Buehlmann
store: add new _exists helper function on fncachestore
r17783 def _exists(self, f):
ef = self.encode(f)
try:
self.getsize(ef)
return True
Gregory Szorc
global: mass rewrite to use modern exception syntax...
r25660 except OSError as err:
Adrian Buehlmann
store: add new _exists helper function on fncachestore
r17783 if err.errno != errno.ENOENT:
raise
# nonexistent entry
return False
smuralid
store: add a contains method to fncachestore...
r17745 def __contains__(self, path):
'''Checks if the store contains path'''
path = "/".join(("data", path))
Adrian Buehlmann
store: move __contains__() implementation from class fncache into fncachestore...
r17782 # check for files (exact match)
Adrian Buehlmann
store: fncache may contain non-existent entries (fixes b9a56b816ff2)
r17784 e = path + '.i'
if e in self.fncache and self._exists(e):
Adrian Buehlmann
store: move __contains__() implementation from class fncache into fncachestore...
r17782 return True
# now check for directories (prefix match)
if not path.endswith('/'):
path += '/'
for e in self.fncache:
Adrian Buehlmann
store: fncache may contain non-existent entries (fixes b9a56b816ff2)
r17784 if e.startswith(path) and self._exists(e):
Adrian Buehlmann
store: move __contains__() implementation from class fncache into fncachestore...
r17782 return True
return False