##// END OF EJS Templates
hgweb: remove dead code handling UnicodeDecodeError...
hgweb: remove dead code handling UnicodeDecodeError I’m quite confident that the error can’t happen on Python 3, as the main motivation for separating bytes and str in Python 3 was to avoid this class of errors.

File last commit:

r49801:642e31cb default
r50178:44b26349 default
Show More
store.py
849 lines | 25.2 KiB | text/x-python | PythonLexer
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839 # store.py - repository store handling for Mercurial
#
Raphaël Gomès
contributor: change mentions of mpm to olivia...
r47575 # Copyright 2008 Olivia Mackall <olivia@selenic.com>
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839 #
Martin Geisler
updated license to be explicit about GPL version 2
r8225 # This software may be used and distributed according to the terms of the
Matt Mackall
Update license to GPLv2+
r10263 # GNU General Public License version 2 or any later version.
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839
Gregory Szorc
store: use absolute_import
r27480
import errno
Pulkit Goyal
store: don't read the whole fncache in memory...
r42144 import functools
Gregory Szorc
store: use absolute_import
r27480 import os
store: exclude `undo.` nodemap's file from `walk`...
r47752 import re
Gregory Szorc
store: use absolute_import
r27480 import stat
from .i18n import _
Gregory Szorc
py3: manually import getattr where it is needed...
r43359 from .pycompat import getattr
Joerg Sonnenberger
node: import symbols explicitly...
r46729 from .node import hex
Gregory Szorc
store: use absolute_import
r27480 from . import (
Augie Fackler
localrepo: push manifestlog and changelog construction code into store...
r43175 changelog,
Gregory Szorc
store: use absolute_import
r27480 error,
Augie Fackler
localrepo: push manifestlog and changelog construction code into store...
r43175 manifest,
Yuya Nishihara
parsers: switch to policy importer...
r32372 policy,
Mateusz Kwapich
py3: make encodefun in store.py compatible with py3k...
r30077 pycompat,
Gregory Szorc
store: use absolute_import
r27480 util,
Pierre-Yves David
vfs: use 'vfs' module directly in 'mercurial.store'...
r31234 vfs as vfsmod,
Gregory Szorc
store: use absolute_import
r27480 )
Augie Fackler
core: migrate uses of hashlib.sha1 to hashutil.sha1...
r44517 from .utils import hashutil
Adrian Buehlmann
introduce store classes...
r6840
Augie Fackler
cleanup: remove pointless r-prefixes on single-quoted strings...
# module looked up for optional fast implementations; callers in this file
# use getattr() with a pure Python fallback
parsers = policy.importmod('parsers')
Pulkit Goyal
store: don't read the whole fncache in memory...
# how many bytes should be read from fncache in one read
# It is done to prevent loading large fncache files into memory
fncache_chunksize = 10 ** 6
Yuya Nishihara
parsers: switch to policy importer...
r32372
Augie Fackler
formatting: blacken the codebase...
r43346
Pulkit Goyal
store: introduce _matchtrackedpath() and use it to filter store files...
def _matchtrackedpath(path, matcher):
    """parses a fncache entry and returns whether the entry is tracking a path
    matched by matcher or not.

    If matcher is None, returns True.

    Entries under ``data/`` are matched as files (the ``.i`` suffix is
    stripped); entries under ``meta/`` are matched as directories through
    ``matcher.visitdir`` (the ``/00manifest.i`` suffix is stripped).

    Raises error.ProgrammingError for any other prefix."""
    if matcher is None:
        return True
    path = decodedir(path)
    if path.startswith(b'data/'):
        return matcher(path[len(b'data/') : -len(b'.i')])
    elif path.startswith(b'meta/'):
        return matcher.visitdir(path[len(b'meta/') : -len(b'/00manifest.i')])

    raise error.ProgrammingError(b"cannot decode path %s" % path)
Pulkit Goyal
store: raise ProgrammingError if unable to decode a storage path...
r40658
Augie Fackler
formatting: blacken the codebase...
r43346
Benoit Boissinot
filelog encoding: move the encoding/decoding into store...
# This avoids a collision between a file named foo and a dir named
# foo.i or foo.d
def _encodedir(path):
    """
    append '.hg' to every directory component ending in '.hg', '.i' or '.d'

    Only components followed by a '/' are affected, so the final path
    component is left untouched.

    >>> _encodedir(b'data/foo.i')
    'data/foo.i'
    >>> _encodedir(b'data/foo.i/bla.i')
    'data/foo.i.hg/bla.i'
    >>> _encodedir(b'data/foo.i.hg/bla.i')
    'data/foo.i.hg.hg/bla.i'
    >>> _encodedir(b'data/foo.i\\ndata/foo.i/bla.i\\ndata/foo.i.hg/bla.i\\n')
    'data/foo.i\\ndata/foo.i.hg/bla.i\\ndata/foo.i.hg.hg/bla.i\\n'
    """
    # '.hg/' must be escaped first: the two later replacements introduce new
    # '.hg/' sequences that must not be escaped a second time
    return (
        path.replace(b".hg/", b".hg.hg/")
        .replace(b".i/", b".i.hg/")
        .replace(b".d/", b".d.hg/")
    )
Benoit Boissinot
filelog encoding: move the encoding/decoding into store...
r8531
Adrian Buehlmann
store: use fast C implementation of encodedir() if it's available...
# use the implementation from parsers when it provides one, else pure Python
encodedir = getattr(parsers, 'encodedir', _encodedir)
Augie Fackler
formatting: blacken the codebase...
r43346
Benoit Boissinot
filelog encoding: move the encoding/decoding into store...
def decodedir(path):
    """
    strip the '.hg' suffix from directory components ending in '.d.hg',
    '.i.hg' or '.hg.hg'

    >>> decodedir(b'data/foo.i')
    'data/foo.i'
    >>> decodedir(b'data/foo.i.hg/bla.i')
    'data/foo.i/bla.i'
    >>> decodedir(b'data/foo.i.hg.hg/bla.i')
    'data/foo.i.hg/bla.i'
    """
    # fast path: nothing to decode when no directory ends in '.hg'
    if b".hg/" not in path:
        return path
    return (
        path.replace(b".d.hg/", b".d/")
        .replace(b".i.hg/", b".i/")
        .replace(b".hg.hg/", b".hg/")
    )
Benoit Boissinot
filelog encoding: move the encoding/decoding into store...
r8531
timeless
store: treat range as a generator instead of a list for py3 compat
def _reserved():
    """characters that are problematic for filesystems

    * ascii escapes (0..31)
    * ascii hi (126..255)
    * windows specials

    these characters will be escaped by encodefunctions

    Yields the byte values as integers, in the order listed above.
    """
    winreserved = [ord(x) for x in u'\\:*?"<>|']
    yield from range(32)
    yield from range(126, 256)
    yield from winreserved
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
def _buildencodefun():
    """
    build and return the (encode, decode) pair of filename functions

    Encoding maps every byte of the input through a table: reserved bytes
    (see _reserved) become '~xx', uppercase ASCII letters and '_' become
    '_' followed by the lowercased byte, other ASCII bytes are kept.
    Decoding is the inverse and raises KeyError on undecodable input.

    >>> enc, dec = _buildencodefun()

    >>> enc(b'nothing/special.txt')
    'nothing/special.txt'
    >>> dec(b'nothing/special.txt')
    'nothing/special.txt'

    >>> enc(b'HELLO')
    '_h_e_l_l_o'
    >>> dec(b'_h_e_l_l_o')
    'HELLO'

    >>> enc(b'hello:world?')
    'hello~3aworld~3f'
    >>> dec(b'hello~3aworld~3f')
    'hello:world?'

    >>> enc(b'the\\x07quick\\xADshot')
    'the~07quick~adshot'
    >>> dec(b'the~07quick~adshot')
    'the\\x07quick\\xadshot'
    """
    e = b'_'
    xchr = pycompat.bytechr
    asciistr = list(map(xchr, range(127)))
    capitals = list(range(ord(b"A"), ord(b"Z") + 1))

    # encoding table: single byte -> encoded bytes
    cmap = {x: x for x in asciistr}
    for x in _reserved():
        cmap[xchr(x)] = b"~%02x" % x
    for x in capitals + [ord(e)]:
        cmap[xchr(x)] = e + xchr(x).lower()

    # decoding table: encoded bytes (1 to 3 bytes long) -> single byte
    dmap = {v: k for k, v in cmap.items()}

    def decode(s):
        i = 0
        while i < len(s):
            # encoded tokens are 1 ('a'), 2 ('_a') or 3 ('~3a') bytes long;
            # try the shortest first
            for width in range(1, 4):
                try:
                    yield dmap[s[i : i + width]]
                    i += width
                    break
                except KeyError:
                    pass
            else:
                raise KeyError

    return (
        lambda s: b''.join([cmap[s[c : c + 1]] for c in range(len(s))]),
        lambda s: b''.join(decode(s)),
    )
Adrian Buehlmann
store: extract functions _encodefname and _decodefname
r17608
# module-level (encode, decode) pair shared by the functions below
_encodefname, _decodefname = _buildencodefun()
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: extract functions _encodefname and _decodefname
def encodefilename(s):
    """
    apply the directory encoding (encodedir), then the per-byte filename
    encoding (_encodefname)

    >>> encodefilename(b'foo.i/bar.d/bla.hg/hi:world?/HELLO')
    'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o'
    """
    return _encodefname(encodedir(s))
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: extract functions _encodefname and _decodefname
def decodefilename(s):
    """
    inverse of encodefilename: undo the per-byte filename encoding
    (_decodefname), then the directory encoding (decodedir)

    >>> decodefilename(b'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o')
    'foo.i/bar.d/bla.hg/hi:world?/HELLO'
    """
    return decodedir(_decodefname(s))
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: change names to comply with project coding standards...
def _buildlowerencodefun():
    """
    build and return the pure Python lowerencode function

    The returned function escapes reserved bytes (see _reserved) as '~xx'
    and lowercases ASCII uppercase letters; unlike the encoding built by
    _buildencodefun it is not reversible.

    >>> f = _buildlowerencodefun()
    >>> f(b'nothing/special.txt')
    'nothing/special.txt'
    >>> f(b'HELLO')
    'hello'
    >>> f(b'hello:world?')
    'hello~3aworld~3f'
    >>> f(b'the\\x07quick\\xADshot')
    'the~07quick~adshot'
    """
    xchr = pycompat.bytechr
    cmap = {xchr(x): xchr(x) for x in range(127)}
    for x in _reserved():
        cmap[xchr(x)] = b"~%02x" % x
    for x in range(ord(b"A"), ord(b"Z") + 1):
        cmap[xchr(x)] = xchr(x).lower()

    def lowerencode(s):
        return b"".join([cmap[c] for c in pycompat.iterbytestr(s)])

    return lowerencode
Adrian Buehlmann
introduce fncache repository layout...
r7229
Augie Fackler
formatting: blacken the codebase...
r43346
Bryan O'Sullivan
store: implement lowerencode in C
# use the implementation from parsers when it provides one, else build the
# pure Python version
lowerencode = getattr(parsers, 'lowerencode', None) or _buildlowerencodefun()
Adrian Buehlmann
introduce fncache repository layout...
r7229
Adrian Buehlmann
store: optimze _auxencode() a bit by grouping the reserved names by length...
# Windows reserved names: con, prn, aux, nul, com1..com9, lpt1..lpt9
_winres3 = (b'aux', b'con', b'prn', b'nul')  # length 3
_winres4 = (b'com', b'lpt')  # length 4 (with trailing 1..9)
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: encode first period or space in filenames (issue1713)...
def _auxencode(path, dotencode):
    """
    Encodes filenames containing names reserved by Windows or which end in
    period or space. Does not touch other single reserved characters c.
    Specifically, c in '\\:*?"<>|' or ord(c) <= 31 are *not* encoded here.
    Additionally encodes space or period at the beginning, if dotencode is
    True. Parameter path is assumed to be all lowercase.
    A segment only needs encoding if a reserved name appears as a
    basename (e.g. "aux", "aux.foo"). A directory or file named "foo.aux"
    doesn't need encoding.

    path is a list of path segments; it is modified in place and also
    returned. Empty segments are left untouched.

    >>> s = b'.foo/aux.txt/txt.aux/con/prn/nul/foo.'
    >>> _auxencode(s.split(b'/'), True)
    ['~2efoo', 'au~78.txt', 'txt.aux', 'co~6e', 'pr~6e', 'nu~6c', 'foo~2e']
    >>> s = b'.com1com2/lpt9.lpt4.lpt1/conprn/com0/lpt0/foo.'
    >>> _auxencode(s.split(b'/'), False)
    ['.com1com2', 'lp~749.lpt4.lpt1', 'conprn', 'com0', 'lpt0', 'foo~2e']
    >>> _auxencode([b'foo. '], True)
    ['foo.~20']
    >>> _auxencode([b' .foo'], True)
    ['~20.foo']
    """
    for i, n in enumerate(path):
        if not n:
            continue
        if dotencode and n[0] in b'. ':
            n = b"~%02x" % ord(n[0:1]) + n[1:]
            path[i] = n
        else:
            # length of the part before the first '.', i.e. of the basename
            dotpos = n.find(b'.')
            if dotpos == -1:
                dotpos = len(n)
            if (dotpos == 3 and n[:3] in _winres3) or (
                dotpos == 4
                and b'1' <= n[3:4] <= b'9'
                and n[:3] in _winres4
            ):
                # encode third letter ('aux' -> 'au~78')
                ec = b"~%02x" % ord(n[2:3])
                n = n[0:2] + ec + n[3:]
                path[i] = n
        if n[-1] in b'. ':
            # encode last period or space ('foo...' -> 'foo..~2e')
            path[i] = n[:-1] + b"~%02x" % ord(n[-1:])
    return path
Adrian Buehlmann
introduce fncache repository layout...
r7229
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: change names to comply with project coding standards...
# paths whose default encoding is longer than this get the hashed encoding
_maxstorepathlen = 120
# number of bytes kept from each directory level in the hashed encoding
_dirprefixlen = 8
# maximum total length of the shortened directory part of a hashed path
_maxshortdirslen = 8 * (_dirprefixlen + 1) - 4
Bryan O'Sullivan
store: refactor hashed encoding into its own function
r17610
Augie Fackler
formatting: blacken the codebase...
r43346
Bryan O'Sullivan
store: refactor hashed encoding into its own function
def _hashencode(path, dotencode):
    """return the hashed (non-reversible) store path for path

    The result is 'dh/' + shortened directories + filler + sha1 hex digest
    of the full path + the extension of the basename. Directories are
    shortened to _dirprefixlen bytes each and kept only while their joined
    length fits in _maxshortdirslen. The filler is the start of the
    lowerencoded basename, as long as fits in _maxstorepathlen.
    """
    digest = hex(hashutil.sha1(path).digest())
    le = lowerencode(path[5:]).split(b'/')  # skips prefix 'data/' or 'meta/'
    parts = _auxencode(le, dotencode)
    basename = parts[-1]
    _root, ext = os.path.splitext(basename)
    sdirs = []
    sdirslen = 0
    for p in parts[:-1]:
        d = p[:_dirprefixlen]
        if d[-1] in b'. ':
            # Windows can't access dirs ending in period or space
            d = d[:-1] + b'_'
        if sdirslen == 0:
            t = len(d)
        else:
            # +1 accounts for the '/' joining this level to the previous ones
            t = sdirslen + 1 + len(d)
            if t > _maxshortdirslen:
                break
        sdirs.append(d)
        sdirslen = t
    dirs = b'/'.join(sdirs)
    if len(dirs) > 0:
        dirs += b'/'
    res = b'dh/' + dirs + digest + ext
    spaceleft = _maxstorepathlen - len(res)
    if spaceleft > 0:
        filler = basename[:spaceleft]
        res = b'dh/' + dirs + filler + digest + ext
    return res
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: eliminate one level of lambda functions on _hybridencode
def _hybridencode(path, dotencode):
    """encodes path with a length limit

    Encodes all paths that begin with 'data/', according to the following.

    Default encoding (reversible):

    Encodes all uppercase letters 'X' as '_x'. All reserved or illegal
    characters are encoded as '~xx', where xx is the two digit hex code
    of the character (see encodefilename).
    Relevant path components consisting of Windows reserved filenames are
    masked by encoding the third character ('aux' -> 'au~78', see _auxencode).

    Hashed encoding (not reversible):

    If the default-encoded path is longer than _maxstorepathlen, a
    non-reversible hybrid hashing of the path is done instead.
    This encoding uses up to _dirprefixlen characters of all directory
    levels of the lowerencoded path, but not more levels than can fit into
    _maxshortdirslen.
    Then follows the filler followed by the sha digest of the full path.
    The filler is the beginning of the basename of the lowerencoded path
    (the basename is everything after the last path separator). The filler
    is as long as possible, filling in characters from the basename until
    the encoded path has _maxstorepathlen characters (or all chars of the
    basename have been taken).
    The extension (e.g. '.i' or '.d') is preserved.

    The string 'data/' at the beginning is replaced with 'dh/', if the hashed
    encoding was used.
    """
    path = encodedir(path)
    ef = _encodefname(path).split(b'/')
    res = b'/'.join(_auxencode(ef, dotencode))
    if len(res) > _maxstorepathlen:
        res = _hashencode(path, dotencode)
    return res
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: add a fallback _pathencode Python function...
def _pathencode(path):
    """pure Python path encoding, always with dot-encoding enabled

    Returns the default (reversible) encoding of path, or the hashed
    encoding (see _hashencode) when either the unencoded path or its
    default encoding is longer than _maxstorepathlen.
    """
    de = encodedir(path)
    # cheap early exit: skip the default encoding when the raw path is
    # already over the limit
    if len(path) > _maxstorepathlen:
        return _hashencode(de, True)
    ef = _encodefname(de).split(b'/')
    res = b'/'.join(_auxencode(ef, True))
    if len(res) > _maxstorepathlen:
        return _hashencode(de, True)
    return res
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: add a fallback _pathencode Python function...
# use the implementation from parsers when it provides one, else pure Python
_pathencode = getattr(parsers, 'pathencode', _pathencode)
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: move _plainhybridencode and _dothybridencode higher up in the file...
def _plainhybridencode(f):
    """hybrid-encode f without encoding leading periods or spaces"""
    return _hybridencode(f, False)
Augie Fackler
formatting: blacken the codebase...
r43346
FUJIWARA Katsunori
store: invoke "os.stat()" for "createmode" initialization via vfs...
def _calcmode(vfs):
    """return the mode to create store files with, or None

    The mode is taken from ``vfs.stat()``. None is returned when the stat
    call fails with OSError, or when the permission bits already equal what
    the current umask would produce (so no chmod is needed).
    """
    try:
        # files in .hg/ will be created using this mode
        mode = vfs.stat().st_mode
    except OSError:
        return None
    # avoid some useless chmods
    if (0o777 & ~util.umask) == (0o777 & mode):
        return None
    return mode
Augie Fackler
formatting: blacken the codebase...
r43346
Pulkit Goyal
store: refactor space delimited list to proper data structure...
# names of store-level files and directories
_data = [
    b'bookmarks',
    b'narrowspec',
    b'data',
    b'meta',
    b'00manifest.d',
    b'00manifest.i',
    b'00changelog.d',
    b'00changelog.i',
    b'phaseroots',
    b'obsstore',
    b'requires',
]
Augie Fackler
formatting: blacken the codebase...
r43346
store: also return some information about the type of file `walk` found...
# filename suffixes identifying the main file of a revlog
REVLOG_FILES_MAIN_EXT = (b'.i', b'i.tmpcensored')
# filename suffixes identifying the secondary files of a revlog
REVLOG_FILES_OTHER_EXT = (
    b'.idx',
    b'.d',
    b'.dat',
    b'.n',
    b'.nd',
    b'.sda',
    b'd.tmpcensored',
)
# files that are "volatile" and might change between listing and streaming
#
# note: the ".nd" file are nodemap data and won't "change" but they might be
# deleted.
REVLOG_FILES_VOLATILE_EXT = (b'.n', b'.nd')
store: also return some information about the type of file `walk` found...
r47657
store: exclude `undo.` nodemap's file from `walk`...
# some exception to the above matching
#
# XXX This is currently not in use because of issue6542
#
# (raw bytes literal: '\.' is not a valid escape in a plain bytes literal)
EXCLUDED = re.compile(br'.*undo\.[^/]+\.(nd?|i)$')
store: exclude `undo.` nodemap's file from `walk`...
r47752
store: also return some information about the type of file `walk` found...
r47657
def is_revlog(f, kind, st):
    """return the revlog type flags for directory entry f, or None

    Only regular files (kind == stat.S_IFREG) are considered; st is
    accepted but not used here.
    """
    if kind != stat.S_IFREG:
        return None
    return revlog_type(f)
def revlog_type(f):
    """classify filename f by its suffix

    Returns FILEFLAGS_REVLOG_MAIN for a main revlog file,
    FILETYPE_FILELOG_OTHER (with FILEFLAGS_VOLATILE added for volatile
    suffixes) for a secondary revlog file, and None otherwise.
    """
    # XXX we need to filter `undo.` created by the transaction here, however
    # being naive about it also filter revlog for `undo.*` files, leading to
    # issue6542. So we no longer use EXCLUDED.
    if f.endswith(REVLOG_FILES_MAIN_EXT):
        return FILEFLAGS_REVLOG_MAIN
    elif f.endswith(REVLOG_FILES_OTHER_EXT):
        t = FILETYPE_FILELOG_OTHER
        if f.endswith(REVLOG_FILES_VOLATILE_EXT):
            t |= FILEFLAGS_VOLATILE
        return t
    return None
store: use `endswith` to detect revlog extension...
r47112
Matt Mackall
clone: get a list of files to clone from store
r6903
store: also return some information about the type of file `walk` found...
# the file is part of changelog data
FILEFLAGS_CHANGELOG = 1 << 13
# the file is part of manifest data
FILEFLAGS_MANIFESTLOG = 1 << 12
# the file is part of filelog data
FILEFLAGS_FILELOG = 1 << 11
# file that are not directly part of a revlog
FILEFLAGS_OTHER = 1 << 10

# the main entry point for a revlog
FILEFLAGS_REVLOG_MAIN = 1 << 1
# a secondary file for a revlog
FILEFLAGS_REVLOG_OTHER = 1 << 0

# files that are "volatile" and might change between listing and streaming
FILEFLAGS_VOLATILE = 1 << 20

FILETYPE_CHANGELOG_MAIN = FILEFLAGS_CHANGELOG | FILEFLAGS_REVLOG_MAIN
FILETYPE_CHANGELOG_OTHER = FILEFLAGS_CHANGELOG | FILEFLAGS_REVLOG_OTHER
FILETYPE_MANIFESTLOG_MAIN = FILEFLAGS_MANIFESTLOG | FILEFLAGS_REVLOG_MAIN
FILETYPE_MANIFESTLOG_OTHER = FILEFLAGS_MANIFESTLOG | FILEFLAGS_REVLOG_OTHER
FILETYPE_FILELOG_MAIN = FILEFLAGS_FILELOG | FILEFLAGS_REVLOG_MAIN
FILETYPE_FILELOG_OTHER = FILEFLAGS_FILELOG | FILEFLAGS_REVLOG_OTHER
FILETYPE_OTHER = FILEFLAGS_OTHER
Gregory Szorc
store: make file filtering during walk configurable...
r37427
Augie Fackler
formatting: blacken the codebase...
r43346
Gregory Szorc
py3: use class X: instead of class X(object):...
r49801 class basicstore:
Adrian Buehlmann
introduce store classes...
r6840 '''base class for local repository stores'''
Augie Fackler
formatting: blacken the codebase...
r43346
FUJIWARA Katsunori
store: rename "openertype" argument to "vfstype"
def __init__(self, path, vfstype):
    """set up the store rooted at path

    vfstype is called with path to build the raw vfs. The store keeps:
    - path: the base of that vfs
    - createmode: the mode computed by _calcmode (also set on the raw vfs)
    - rawvfs: the unfiltered vfs
    - vfs / opener: the raw vfs wrapped so that names go through encodedir
    """
    vfs = vfstype(path)
    self.path = vfs.base
    self.createmode = _calcmode(vfs)
    vfs.createmode = self.createmode
    self.rawvfs = vfs
    self.vfs = vfsmod.filtervfs(vfs, encodedir)
    self.opener = self.vfs
Adrian Buehlmann
introduce store classes...
r6840
def join(self, f):
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 return self.path + b'/' + encodedir(f)
Adrian Buehlmann
introduce store classes...
r6840
store: drop the `filefilter` argument to `_walk`...
r47613 def _walk(self, relpath, recurse):
Valentin Gatien-Baron
store: return just one filename in walk functions...
r48691 '''yields (revlog_type, unencoded, size)'''
Adrian Buehlmann
store: remove pointless pathjoiner parameter...
r13426 path = self.path
if relpath:
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 path += b'/' + relpath
Adrian Buehlmann
store: remove pointless pathjoiner parameter...
r13426 striplen = len(self.path) + 1
Matt Mackall
store: simplify walking...
r6899 l = []
FUJIWARA Katsunori
store: invoke "os.path.isdir()" via vfs...
r17728 if self.rawvfs.isdir(path):
Matt Mackall
store: simplify walking...
r6899 visit = [path]
FUJIWARA Katsunori
store: invoke "osutil.listdir()" via vfs...
r17747 readdir = self.rawvfs.readdir
Matt Mackall
store: simplify walking...
r6899 while visit:
p = visit.pop()
FUJIWARA Katsunori
store: invoke "osutil.listdir()" via vfs...
r17747 for f, kind, st in readdir(p, stat=True):
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 fp = p + b'/' + f
store: also return some information about the type of file `walk` found...
r47657 rl_type = is_revlog(f, kind, st)
if rl_type is not None:
Matt Mackall
store: change handling of decoding errors
r6900 n = util.pconvert(fp[striplen:])
Valentin Gatien-Baron
store: return just one filename in walk functions...
r48691 l.append((rl_type, decodedir(n), st.st_size))
Matt Mackall
store: simplify walking...
r6899 elif kind == stat.S_IFDIR and recurse:
visit.append(fp)
Bryan O'Sullivan
store: sort filenames in place
r17054 l.sort()
return l
Adrian Buehlmann
introduce store classes...
r6840
Kyle Lippincott
revlog: add a mechanism to verify expected file position before appending...
r47349 def changelog(self, trypending, concurrencychecker=None):
return changelog.changelog(
self.vfs,
trypending=trypending,
concurrencychecker=concurrencychecker,
)
Augie Fackler
localrepo: push manifestlog and changelog construction code into store...
r43175
def manifestlog(self, repo, storenarrowmatch):
Joerg Sonnenberger
node: introduce nodeconstants class...
r47538 rootstore = manifest.manifestrevlog(repo.nodeconstants, self.vfs)
Augie Fackler
formatting: blacken the codebase...
r43346 return manifest.manifestlog(self.vfs, repo, rootstore, storenarrowmatch)
Augie Fackler
localrepo: push manifestlog and changelog construction code into store...
r43175
Valentin Gatien-Baron
store: return just one filename in walk functions...
r48691 def datafiles(self, matcher=None, undecodable=None):
"""Like walk, but excluding the changelog and root manifest.
When [undecodable] is None, revlogs names that can't be
decoded cause an exception. When it is provided, it should
be a list and the filenames that can't be decoded are added
to it instead. This is very rarely needed."""
store: also return some information about the type of file `walk` found...
r47657 files = self._walk(b'data', True) + self._walk(b'meta', True)
Valentin Gatien-Baron
store: return just one filename in walk functions...
r48691 for (t, u, s) in files:
yield (FILEFLAGS_FILELOG | t, u, s)
Adrian Buehlmann
introduce store classes...
r6840
Durham Goode
store: move top file walk to a separate function...
r19177 def topfiles(self):
# yield manifest before changelog
store: also return some information about the type of file `walk` found...
r47657 files = reversed(self._walk(b'', False))
Valentin Gatien-Baron
store: return just one filename in walk functions...
r48691 for (t, u, s) in files:
store: also return some information about the type of file `walk` found...
r47657 if u.startswith(b'00changelog'):
Valentin Gatien-Baron
store: return just one filename in walk functions...
r48691 yield (FILEFLAGS_CHANGELOG | t, u, s)
store: also return some information about the type of file `walk` found...
r47657 elif u.startswith(b'00manifest'):
Valentin Gatien-Baron
store: return just one filename in walk functions...
r48691 yield (FILEFLAGS_MANIFESTLOG | t, u, s)
store: also return some information about the type of file `walk` found...
r47657 else:
Valentin Gatien-Baron
store: return just one filename in walk functions...
r48691 yield (FILETYPE_OTHER | t, u, s)
Durham Goode
store: move top file walk to a separate function...
r19177
Pulkit Goyal
store: pass matcher to store.datafiles()...
r40376 def walk(self, matcher=None):
store: document the `walk` method...
r47612 """return file related to data storage (ie: revlogs)
Valentin Gatien-Baron
store: return just one filename in walk functions...
r48691 yields (file_type, unencoded, size)
Pulkit Goyal
store: pass matcher to store.datafiles()...
r40376
if a matcher is passed, storage files of only those tracked paths
are passed with matches the matcher
Augie Fackler
formating: upgrade to black 20.8b1...
r46554 """
Adrian Buehlmann
introduce store classes...
r6840 # yield data files first
Pulkit Goyal
store: pass matcher to store.datafiles()...
r40376 for x in self.datafiles(matcher):
Adrian Buehlmann
introduce store classes...
r6840 yield x
Durham Goode
store: move top file walk to a separate function...
r19177 for x in self.topfiles():
Adrian Buehlmann
introduce store classes...
r6840 yield x
Matt Mackall
clone: get a list of files to clone from store
r6903 def copylist(self):
Pulkit Goyal
share: introduce config option to store requires in .hg/store...
r46055 return _data
Matt Mackall
clone: get a list of files to clone from store
r6903
Durham Goode
fncache: move fncache writing to be in a transaction...
r20883 def write(self, tr):
Adrian Buehlmann
fncachestore: defer updating the fncache file to a single file open...
r13391 pass
Durham Goode
caches: invalidate store caches when lock is taken...
r20884 def invalidatecaches(self):
pass
Durham Goode
fncache: clean up fncache during strips...
r20885 def markremoved(self, fn):
pass
smuralid
store: add a contains method to basicstore...
r17744 def __contains__(self, path):
'''Checks if the store contains path'''
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 path = b"/".join((b"data", path))
smuralid
store: add a contains method to basicstore...
r17744 # file?
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 if self.vfs.exists(path + b".i"):
smuralid
store: add a contains method to basicstore...
r17744 return True
# dir?
Augie Fackler
formatting: byteify all mercurial/ and hgext/ string literals...
r43347 if not path.endswith(b"/"):
path = path + b"/"
FUJIWARA Katsunori
store: use "vfs.exists()" instead of "os.path.exists()"
r19903 return self.vfs.exists(path)
smuralid
store: add a contains method to basicstore...
r17744
Augie Fackler
formatting: blacken the codebase...
r43346
Matt Mackall
store: simplify class hierarchy
class encodedstore(basicstore):
    """Store kept under `<path>/store` whose file names are encoded.

    Names are passed through `encodefilename` on the way to disk and
    through `decodefilename` when listing data files.
    """

    def __init__(self, path, vfstype):
        """Build the vfs objects for the store found at `path + b'/store'`."""
        vfs = vfstype(path + b'/store')
        self.path = vfs.base
        self.createmode = _calcmode(vfs)
        vfs.createmode = self.createmode
        self.rawvfs = vfs
        self.vfs = vfsmod.filtervfs(vfs, encodefilename)
        self.opener = self.vfs

    # note: topfiles would also need a decode phase. It is just that in
    # practice we do not have any file outside of `data/` that needs encoding.
    # However that might change so we should probably add a test and encoding
    # decoding for it too. see issue6548

    def datafiles(self, matcher=None, undecodable=None):
        """Yield (file_type, decoded_name, size) for the data files.

        Names that `decodefilename` cannot decode raise `error.StorageError`
        when `undecodable` is None; otherwise they are appended to
        `undecodable` and skipped.  Decoded names rejected by
        `_matchtrackedpath(name, matcher)` are skipped as well.
        """
        for t, f1, size in super().datafiles():
            try:
                f2 = decodefilename(f1)
            except KeyError:
                if undecodable is None:
                    msg = _(b'undecodable revlog name %s') % f1
                    raise error.StorageError(msg)
                undecodable.append(f1)
                continue
            if _matchtrackedpath(f2, matcher):
                yield t, f2, size

    def join(self, f):
        """Return the on-disk path of store file `f` (name-encoded)."""
        return self.path + b'/' + encodefilename(f)

    def copylist(self):
        """Return the names to copy when cloning, relative to the parent of
        the `store/` directory."""
        return [b'requires', b'00changelog.i'] + [b'store/' + f for f in _data]
Augie Fackler
formatting: blacken the codebase...
r43346
Matt Mackall
clone: get a list of files to clone from store
r6903
Gregory Szorc
py3: use class X: instead of class X(object):...
class fncache:
    """In-memory view of the `fncache` file.

    `entries` holds the names read from disk (None until loaded), `addls`
    holds names added since the last write, and `_dirty` records that an
    entry was removed so the file must be rewritten in full.
    """

    # the filename used to be partially encoded
    # hence the encodedir/decodedir dance
    def __init__(self, vfs):
        self.vfs = vfs
        self.entries = None
        self._dirty = False
        # set of new additions to fncache
        self.addls = set()

    def ensureloaded(self, warn=None):
        """read the fncache file if not already read.

        If the file on disk is corrupted, raise. If warn is provided,
        warn and keep going instead."""
        if self.entries is None:
            self._load(warn)

    def _load(self, warn=None):
        """fill the entries from the fncache file

        A file that cannot be opened (IOError) gives an empty entry set.
        A file not ending with a newline, or containing an empty line, is
        reported through `warn` when given and raises `error.Abort`
        otherwise.  The file is closed in every case.
        """
        self._dirty = False
        try:
            fp = self.vfs(b'fncache', mode=b'rb')
        except IOError:
            # skip nonexistent file
            self.entries = set()
            return

        try:
            self.entries = set()
            chunk = b''
            for c in iter(functools.partial(fp.read, fncache_chunksize), b''):
                chunk += c
                p = chunk.rfind(b'\n')
                if p < 0:
                    # substring '\n' not found, maybe the entry is bigger
                    # than the chunksize, so let's keep iterating
                    continue
                self.entries.update(decodedir(chunk[: p + 1]).splitlines())
                chunk = chunk[p + 1 :]

            if chunk:
                msg = _(b"fncache does not ends with a newline")
                if warn:
                    warn(msg + b'\n')
                else:
                    raise error.Abort(
                        msg,
                        hint=_(
                            b"use 'hg debugrebuildfncache' to "
                            b"rebuild the fncache"
                        ),
                    )
            self._checkentries(fp, warn)
        finally:
            # also reached when Abort is raised above, so the handle
            # is never leaked
            fp.close()

    def _checkentries(self, fp, warn):
        """make sure there is no empty string in entries"""
        if b'' in self.entries:
            # re-read the file only to find the offending line numbers
            fp.seek(0)
            for n, line in enumerate(fp):
                if not line.rstrip(b'\n'):
                    t = _(b'invalid entry in fncache, line %d') % (n + 1)
                    if warn:
                        warn(t + b'\n')
                    else:
                        raise error.Abort(t)

    def write(self, tr):
        """Write pending changes to the `fncache` file within `tr`.

        When an entry was removed (`_dirty`) the file is rewritten with the
        loaded entries plus the pending additions.  When there are only
        pending additions they are appended, and `entries` is reset to None
        so the next access reloads the file.
        """
        if self._dirty:
            assert self.entries is not None
            self.entries = self.entries | self.addls
            self.addls = set()
            tr.addbackup(b'fncache')
            fp = self.vfs(b'fncache', mode=b'wb', atomictemp=True)
            if self.entries:
                fp.write(encodedir(b'\n'.join(self.entries) + b'\n'))
            fp.close()
            self._dirty = False
        if self.addls:
            # if we have just new entries, let's append them to the fncache
            tr.addbackup(b'fncache')
            fp = self.vfs(b'fncache', mode=b'ab', atomictemp=True)
            fp.write(encodedir(b'\n'.join(self.addls) + b'\n'))
            fp.close()
            self.entries = None
            self.addls = set()

    def add(self, fn):
        """Record `fn` as a pending addition unless already on disk."""
        if self.entries is None:
            self._load()
        if fn not in self.entries:
            self.addls.add(fn)

    def remove(self, fn):
        """Forget `fn`; mark the cache dirty if it was a loaded entry."""
        if self.entries is None:
            self._load()
        if fn in self.addls:
            # never written to disk: dropping the pending add is enough
            self.addls.remove(fn)
            return
        try:
            self.entries.remove(fn)
        except KeyError:
            return
        self._dirty = True

    def __contains__(self, fn):
        # check pending additions first: this avoids loading the file
        if fn in self.addls:
            return True
        if self.entries is None:
            self._load()
        return fn in self.entries

    def __iter__(self):
        if self.entries is None:
            self._load()
        return iter(self.entries | self.addls)
Adrian Buehlmann
introduce fncache repository layout...
r7229
Augie Fackler
formatting: blacken the codebase...
r43346
Boris Feld
vfs: fix proxyvfs inheritance...
class _fncachevfs(vfsmod.proxyvfs):
    """vfs proxy that encodes names and records new files in the fncache."""

    def __init__(self, vfs, fnc, encode):
        vfsmod.proxyvfs.__init__(self, vfs)
        self.fncache = fnc
        self.encode = encode

    def __call__(self, path, mode=b'r', *args, **kw):
        """Open `path` through the wrapped vfs using its encoded name.

        When a file under `data/` or `meta/` is opened in any mode other
        than b'r' / b'rb', it is added to the fncache, unless the cache is
        not loaded yet and the file already exists with a non-zero size
        (see the comments below).
        """
        encoded = self.encode(path)
        tracked = path.startswith((b'data/', b'meta/'))
        if tracked and mode not in (b'r', b'rb'):
            # do not trigger a fncache load when adding a file that already is
            # known to exist.
            notload = self.fncache.entries is None and self.vfs.exists(encoded)
            if notload and b'r+' in mode and not self.vfs.stat(encoded).st_size:
                # when appending to an existing file, if the file has size zero,
                # it should be considered as missing. Such zero-size files are
                # the result of truncation when a transaction is aborted.
                notload = False
            if not notload:
                self.fncache.add(path)
        return self.vfs(encoded, mode, *args, **kw)

    def join(self, path):
        """Join `path` via the wrapped vfs, encoding it unless it is empty."""
        if path:
            return self.vfs.join(self.encode(path))
        return self.vfs.join(path)

    def register_file(self, path):
        """generic hook point to lets fncache steer its stew"""
        if path.startswith((b'data/', b'meta/')):
            self.fncache.add(path)
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
introduce fncache repository layout...
class fncachestore(basicstore):
    """Store kept under `<path>/store` that lists its data files in an
    `fncache` file instead of walking the directory tree."""

    def __init__(self, path, vfstype, dotencode):
        """Build the vfs objects and fncache for the store at
        `path + b'/store'`.

        `dotencode` selects `_pathencode` as the name encoder; otherwise
        `_plainhybridencode` is used.
        """
        if dotencode:
            encode = _pathencode
        else:
            encode = _plainhybridencode
        self.encode = encode
        vfs = vfstype(path + b'/store')
        self.path = vfs.base
        self.pathsep = self.path + b'/'
        self.createmode = _calcmode(vfs)
        vfs.createmode = self.createmode
        self.rawvfs = vfs
        fnc = fncache(vfs)
        self.fncache = fnc
        self.vfs = _fncachevfs(vfs, fnc, encode)
        self.opener = self.vfs

    def join(self, f):
        """Return the on-disk path of store file `f` (name-encoded)."""
        return self.pathsep + self.encode(f)

    def getsize(self, path):
        """Return the size of the already-encoded `path` via the raw vfs."""
        return self.rawvfs.stat(path).st_size

    def datafiles(self, matcher=None, undecodable=None):
        """Yield (file_type, name, size) for fncache entries, in sorted order.

        Entries rejected by `_matchtrackedpath(name, matcher)` are skipped,
        and so are entries whose file no longer exists on disk (ENOENT);
        any other OSError propagates.  `undecodable` is not used here.
        """
        for f in sorted(self.fncache):
            if not _matchtrackedpath(f, matcher):
                continue
            ef = self.encode(f)
            t = revlog_type(f)
            assert t is not None, f
            t |= FILEFLAGS_FILELOG
            try:
                size = self.getsize(ef)
            except OSError as err:
                if err.errno != errno.ENOENT:
                    raise
                # stale fncache entry: the file is gone
                continue
            yield t, f, size

    def copylist(self):
        """Return the names to copy when cloning, relative to the parent of
        the `store/` directory."""
        d = (
            b'bookmarks',
            b'narrowspec',
            b'data',
            b'meta',
            b'dh',
            b'fncache',
            b'phaseroots',
            b'obsstore',
            b'00manifest.d',
            b'00manifest.i',
            b'00changelog.d',
            b'00changelog.i',
            b'requires',
        )
        return [b'requires', b'00changelog.i'] + [b'store/' + f for f in d]

    def write(self, tr):
        """Write pending fncache changes within transaction `tr`."""
        self.fncache.write(tr)

    def invalidatecaches(self):
        """Drop the loaded fncache entries and any pending additions."""
        self.fncache.entries = None
        self.fncache.addls = set()

    def markremoved(self, fn):
        """Remove `fn` from the fncache."""
        self.fncache.remove(fn)

    def _exists(self, f):
        """Return True if the (unencoded) store file `f` can be stat'ed.

        A missing file (ENOENT) gives False; any other OSError propagates.
        """
        ef = self.encode(f)
        try:
            self.getsize(ef)
        except OSError as err:
            if err.errno != errno.ENOENT:
                raise
            # nonexistent entry
            return False
        return True

    def __contains__(self, path):
        """Checks if the store contains path"""
        path = b"/".join((b"data", path))
        # check for files (exact match)
        e = path + b'.i'
        if e in self.fncache and self._exists(e):
            return True
        # now check for directories (prefix match)
        if not path.endswith(b'/'):
            path += b'/'
        return any(
            e.startswith(path) and self._exists(e) for e in self.fncache
        )