##// END OF EJS Templates
mq: stop using the `pycompat.open()` shim
mq: stop using the `pycompat.open()` shim

File last commit:

r53256:3f0cf7bb default
r53269:e95b0013 default
Show More
store.py
1276 lines | 37.8 KiB | text/x-python | PythonLexer
store: use the revlog type from revlog's constant instead of custom one...
r51573 # store.py - repository store handling for Mercurial)
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839 #
Raphaël Gomès
contributor: change mentions of mpm to olivia...
r47575 # Copyright 2008 Olivia Mackall <olivia@selenic.com>
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839 #
Martin Geisler
updated license to be explicit about GPL version 2
r8225 # This software may be used and distributed according to the terms of the
Matt Mackall
Update license to GPLv2+
r10263 # GNU General Public License version 2 or any later version.
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839
Matt Harbison
typing: add `from __future__ import annotations` to most files...
r52756 from __future__ import annotations
store: add logic to group revlog file together...
r51372 import collections
Pulkit Goyal
store: don't read the whole fncache in memory...
r42144 import functools
Gregory Szorc
store: use absolute_import
r27480 import os
store: exclude `undo.` nodemap's file from `walk`...
r47752 import re
Gregory Szorc
store: use absolute_import
r27480 import stat
Matt Harbison
typing: induce pytype to use the standard `attr` instead of the vendored copy...
r52622 import typing
Matt Harbison
store: fix a signature mismatch for a vfs subclass...
r52775 from typing import (
Generator,
List,
Optional,
)
Gregory Szorc
store: use absolute_import
r27480
from .i18n import _
store: use a StoreEntry object instead of tuple for store files...
r51364 from .thirdparty import attr
Matt Harbison
typing: induce pytype to use the standard `attr` instead of the vendored copy...
r52622
# Force pytype to use the non-vendored package
if typing.TYPE_CHECKING:
# noinspection PyPackageRequirements
import attr
Joerg Sonnenberger
node: import symbols explicitly...
r46729 from .node import hex
Arseniy Alekseyev
stream-clone: avoid opening a revlog in case we do not need it...
r51565 from .revlogutils.constants import (
INDEX_HEADER,
store: use the revlog type from revlog's constant instead of custom one...
r51573 KIND_CHANGELOG,
KIND_FILELOG,
KIND_MANIFESTLOG,
Arseniy Alekseyev
stream-clone: avoid opening a revlog in case we do not need it...
r51565 )
Gregory Szorc
store: use absolute_import
r27480 from . import (
Augie Fackler
localrepo: push manifestlog and changelog construction code into store...
r43175 changelog,
Gregory Szorc
store: use absolute_import
r27480 error,
store: add a `get_revlog_instance` method on revlog entries...
r51520 filelog,
Augie Fackler
localrepo: push manifestlog and changelog construction code into store...
r43175 manifest,
Yuya Nishihara
parsers: switch to policy importer...
r32372 policy,
Mateusz Kwapich
py3: make encodefun in store.py compatible with py3k...
r30077 pycompat,
Arseniy Alekseyev
stream-clone: avoid opening a revlog in case we do not need it...
r51565 revlog as revlogmod,
Gregory Szorc
store: use absolute_import
r27480 util,
Pierre-Yves David
vfs: use 'vfs' module directly in 'mercurial.store'...
r31234 vfs as vfsmod,
Gregory Szorc
store: use absolute_import
r27480 )
Augie Fackler
core: migrate uses of hashlib.sha1 to hashutil.sha1...
r44517 from .utils import hashutil
Adrian Buehlmann
introduce store classes...
r6840
Augie Fackler
cleanup: remove pointless r-prefixes on single-quoted strings...
r43906 parsers = policy.importmod('parsers')
Pulkit Goyal
store: don't read the whole fncache in memory...
# how many bytes should be read from fncache in one read
# It is done to prevent loading large fncache files into memory
fncache_chunksize = 10**6
Yuya Nishihara
parsers: switch to policy importer...
r32372
Augie Fackler
formatting: blacken the codebase...
r43346
Matt Harbison
typing: disable some pytype errors in `mercurial.store`...
def _match_tracked_entry(entry: "BaseStoreEntry", matcher):
    """tell whether a store entry tracks a path selected by ``matcher``

    If ``matcher`` is None, returns True without inspecting ``entry``.

    A filelog entry is tested by calling ``matcher`` on ``entry.target_id``.
    A manifestlog entry is tested by calling ``matcher.visitdir()`` on
    ``entry.target_id`` with any trailing ``/`` stripped.

    Raises error.ProgrammingError for an entry that is neither a filelog
    nor a manifestlog.
    """
    if matcher is None:
        return True

    # TODO: make this safe for other entry types.  Currently, the various
    #  store.data_entry generators only yield RevlogStoreEntry, so the
    #  attributes do exist on `entry`.
    # pytype: disable=attribute-error
    if entry.is_filelog:
        return matcher(entry.target_id)
    elif entry.is_manifestlog:
        return matcher.visitdir(entry.target_id.rstrip(b'/'))
    # pytype: enable=attribute-error
    raise error.ProgrammingError(b"cannot process entry %r" % entry)
Pulkit Goyal
store: raise ProgrammingError if unable to decode a storage path...
r40658
Augie Fackler
formatting: blacken the codebase...
r43346
Benoit Boissinot
filelog encoding: move the encoding/decoding into store...
r8531 # This avoids a collision between a file named foo and a dir named
# foo.i or foo.d
Adrian Buehlmann
store: use fast C implementation of encodedir() if it's available...
def _encodedir(path):
    """escape directory names that end in ``.hg``, ``.i`` or ``.d``

    ``.hg`` is appended to every path component (anything followed by
    ``/``) that ends in one of those suffixes.  ``.hg/`` is rewritten first
    so that the ``.hg`` added for ``.i/`` and ``.d/`` is not escaped again.

    >>> _encodedir(b'data/foo.i')
    'data/foo.i'
    >>> _encodedir(b'data/foo.i/bla.i')
    'data/foo.i.hg/bla.i'
    >>> _encodedir(b'data/foo.i.hg/bla.i')
    'data/foo.i.hg.hg/bla.i'
    >>> _encodedir(b'data/foo.i\\ndata/foo.i/bla.i\\ndata/foo.i.hg/bla.i\\n')
    'data/foo.i\\ndata/foo.i.hg/bla.i\\ndata/foo.i.hg.hg/bla.i\\n'
    """
    return (
        path.replace(b".hg/", b".hg.hg/")
        .replace(b".i/", b".i.hg/")
        .replace(b".d/", b".d.hg/")
    )
Benoit Boissinot
filelog encoding: move the encoding/decoding into store...
r8531
Adrian Buehlmann
store: use fast C implementation of encodedir() if it's available...
r17607 encodedir = getattr(parsers, 'encodedir', _encodedir)
Augie Fackler
formatting: blacken the codebase...
r43346
Benoit Boissinot
filelog encoding: move the encoding/decoding into store...
def decodedir(path):
    """undo the directory escaping done by ``_encodedir``

    Paths that do not contain ``.hg/`` are returned unchanged without doing
    any replacement.

    >>> decodedir(b'data/foo.i')
    'data/foo.i'
    >>> decodedir(b'data/foo.i.hg/bla.i')
    'data/foo.i/bla.i'
    >>> decodedir(b'data/foo.i.hg.hg/bla.i')
    'data/foo.i.hg/bla.i'
    """
    if b".hg/" not in path:
        return path
    # reverse order of _encodedir: the `.hg.hg/` form must be handled last
    return (
        path.replace(b".d.hg/", b".d/")
        .replace(b".i.hg/", b".i/")
        .replace(b".hg.hg/", b".hg/")
    )
Benoit Boissinot
filelog encoding: move the encoding/decoding into store...
r8531
timeless
store: treat range as a generator instead of a list for py3 compat
def _reserved():
    """characters that are problematic for filesystems

    * ascii escapes (0..31)
    * ascii hi (126..255)
    * windows specials

    these characters will be escaped by encodefunctions

    Yields the integer code of each such character, in the order listed
    above.
    """
    winreserved = [ord(x) for x in u'\\:*?"<>|']
    yield from range(32)
    yield from range(126, 256)
    yield from winreserved
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
def _buildencodefun():
    """build the reversible filename (encode, decode) function pair

    Returns a 2-tuple of functions working on bytes.  The encoder maps each
    byte through a table: reserved bytes (see ``_reserved``) become ``~xx``
    (two hex digits), upper-case ASCII letters and ``_`` become ``_``
    followed by the lower-cased byte, other ASCII bytes are kept.  The
    decoder applies the inverse table and raises KeyError on input that
    cannot be decoded.

    >>> enc, dec = _buildencodefun()

    >>> enc(b'nothing/special.txt')
    'nothing/special.txt'
    >>> dec(b'nothing/special.txt')
    'nothing/special.txt'

    >>> enc(b'HELLO')
    '_h_e_l_l_o'
    >>> dec(b'_h_e_l_l_o')
    'HELLO'

    >>> enc(b'hello:world?')
    'hello~3aworld~3f'
    >>> dec(b'hello~3aworld~3f')
    'hello:world?'

    >>> enc(b'the\\x07quick\\xADshot')
    'the~07quick~adshot'
    >>> dec(b'the~07quick~adshot')
    'the\\x07quick\\xadshot'
    """
    e = b'_'
    xchr = pycompat.bytechr
    asciistr = list(map(xchr, range(127)))
    capitals = list(range(ord(b"A"), ord(b"Z") + 1))

    # start from the identity mapping, then override the special cases
    cmap = {x: x for x in asciistr}
    for x in _reserved():
        cmap[xchr(x)] = b"~%02x" % x
    for x in capitals + [ord(e)]:
        cmap[xchr(x)] = e + xchr(x).lower()

    # inverse table: encoded token (1 to 3 bytes long) -> original byte
    dmap = {}
    for k, v in cmap.items():
        dmap[v] = k

    def decode(s):
        i = 0
        while i < len(s):
            # try the shortest token first: 1 byte, then `_x`, then `~xx`
            for l in range(1, 4):
                try:
                    yield dmap[s[i : i + l]]
                    i += l
                    break
                except KeyError:
                    pass
            else:
                # no token of any length matched at position i
                raise KeyError

    return (
        lambda s: b''.join([cmap[s[c : c + 1]] for c in range(len(s))]),
        lambda s: b''.join(list(decode(s))),
    )
Adrian Buehlmann
store: extract functions _encodefname and _decodefname
r17608
_encodefname, _decodefname = _buildencodefun()
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: extract functions _encodefname and _decodefname
def encodefilename(s):
    """apply directory escaping (``encodedir``) then ``_encodefname`` to s

    >>> encodefilename(b'foo.i/bar.d/bla.hg/hi:world?/HELLO')
    'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o'
    """
    return _encodefname(encodedir(s))
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: extract functions _encodefname and _decodefname
def decodefilename(s):
    """apply ``_decodefname`` then ``decodedir`` to s

    >>> decodefilename(b'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o')
    'foo.i/bar.d/bla.hg/hi:world?/HELLO'
    """
    return decodedir(_decodefname(s))
Adrian Buehlmann
move filename encoding functions from util.py to new store.py
r6839
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: change names to comply with project coding standards...
def _buildlowerencodefun():
    """build a function that lower-cases and escapes a bytes path

    The returned function maps each byte through a table: reserved bytes
    (see ``_reserved``) become ``~xx`` (two hex digits), upper-case ASCII
    letters are lower-cased, other ASCII bytes are kept.

    >>> f = _buildlowerencodefun()
    >>> f(b'nothing/special.txt')
    'nothing/special.txt'
    >>> f(b'HELLO')
    'hello'
    >>> f(b'hello:world?')
    'hello~3aworld~3f'
    >>> f(b'the\\x07quick\\xADshot')
    'the~07quick~adshot'
    """
    xchr = pycompat.bytechr
    cmap = {xchr(x): xchr(x) for x in range(127)}
    for x in _reserved():
        cmap[xchr(x)] = b"~%02x" % x
    for x in range(ord(b"A"), ord(b"Z") + 1):
        cmap[xchr(x)] = xchr(x).lower()

    def lowerencode(s):
        return b"".join([cmap[c] for c in pycompat.iterbytestr(s)])

    return lowerencode
Adrian Buehlmann
introduce fncache repository layout...
r7229
Augie Fackler
formatting: blacken the codebase...
r43346
Bryan O'Sullivan
store: implement lowerencode in C
r18430 lowerencode = getattr(parsers, 'lowerencode', None) or _buildlowerencodefun()
Adrian Buehlmann
introduce fncache repository layout...
r7229
Adrian Buehlmann
store: optimze _auxencode() a bit by grouping the reserved names by length...
# Windows reserved names: con, prn, aux, nul, com1..com9, lpt1..lpt9
_winres3 = (b'aux', b'con', b'prn', b'nul')  # length 3
_winres4 = (b'com', b'lpt')  # length 4 (with trailing 1..9)


def _auxencode(path, dotencode):
    """
    Encodes filenames containing names reserved by Windows or which end in
    period or space. Does not touch other single reserved characters c.
    Specifically, c in '\\:*?"<>|' or ord(c) <= 31 are *not* encoded here.
    Additionally encodes space or period at the beginning, if dotencode is
    True. Parameter path is assumed to be all lowercase.
    A segment only needs encoding if a reserved name appears as a
    basename (e.g. "aux", "aux.foo"). A directory or file named "foo.aux"
    doesn't need encoding.

    Parameter path is a list of path segments; it is modified in place and
    the same list is returned. Empty segments are left untouched.

    >>> s = b'.foo/aux.txt/txt.aux/con/prn/nul/foo.'
    >>> _auxencode(s.split(b'/'), True)
    ['~2efoo', 'au~78.txt', 'txt.aux', 'co~6e', 'pr~6e', 'nu~6c', 'foo~2e']
    >>> s = b'.com1com2/lpt9.lpt4.lpt1/conprn/com0/lpt0/foo.'
    >>> _auxencode(s.split(b'/'), False)
    ['.com1com2', 'lp~749.lpt4.lpt1', 'conprn', 'com0', 'lpt0', 'foo~2e']
    >>> _auxencode([b'foo. '], True)
    ['foo.~20']
    >>> _auxencode([b' .foo'], True)
    ['~20.foo']
    """
    for i, n in enumerate(path):
        if not n:
            continue
        if dotencode and n[0] in b'. ':
            # encode leading period or space ('.foo' -> '~2efoo')
            n = b"~%02x" % ord(n[0:1]) + n[1:]
            path[i] = n
        else:
            # l is the length of the part before the first period
            l = n.find(b'.')
            if l == -1:
                l = len(n)
            if (l == 3 and n[:3] in _winres3) or (
                l == 4 and b'1' <= n[3:4] <= b'9' and n[:3] in _winres4
            ):
                # encode third letter ('aux' -> 'au~78')
                ec = b"~%02x" % ord(n[2:3])
                n = n[0:2] + ec + n[3:]
                path[i] = n
        if n[-1] in b'. ':
            # encode last period or space ('foo...' -> 'foo..~2e')
            path[i] = n[:-1] + b"~%02x" % ord(n[-1:])
    return path
Adrian Buehlmann
introduce fncache repository layout...
r7229
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: change names to comply with project coding standards...
# encoded store paths longer than this are replaced by the hashed encoding
_maxstorepathlen = 120
# number of leading characters kept from each directory level when hashing
_dirprefixlen = 8
# upper bound on the combined length of the shortened directory levels
_maxshortdirslen = 8 * (_dirprefixlen + 1) - 4
Bryan O'Sullivan
store: refactor hashed encoding into its own function
r17610
Augie Fackler
formatting: blacken the codebase...
r43346
Bryan O'Sullivan
store: refactor hashed encoding into its own function
def _hashencode(path, dotencode):
    """return the non-reversible hashed store path for ``path``

    The result has the form ``dh/<short dirs>/<filler><sha1 hex><ext>``:

    * the digest is the SHA-1 of the full ``path``
    * each directory level of the lower-encoded path contributes at most
      ``_dirprefixlen`` characters, and levels are dropped once their joined
      length would exceed ``_maxshortdirslen``
    * the filler is the start of the encoded basename, as long as fits
      within ``_maxstorepathlen``
    * the extension of the basename is preserved

    ``dotencode`` is forwarded to ``_auxencode``.
    """
    digest = hex(hashutil.sha1(path).digest())
    le = lowerencode(path[5:]).split(b'/')  # skips prefix 'data/' or 'meta/'
    parts = _auxencode(le, dotencode)
    basename = parts[-1]
    _root, ext = os.path.splitext(basename)
    sdirs = []
    sdirslen = 0
    for p in parts[:-1]:
        d = p[:_dirprefixlen]
        if d[-1] in b'. ':
            # Windows can't access dirs ending in period or space
            d = d[:-1] + b'_'
        if sdirslen == 0:
            t = len(d)
        else:
            # account for the '/' joining this level to the previous ones
            t = sdirslen + 1 + len(d)
            if t > _maxshortdirslen:
                break
        sdirs.append(d)
        sdirslen = t
    dirs = b'/'.join(sdirs)
    if len(dirs) > 0:
        dirs += b'/'
    res = b'dh/' + dirs + digest + ext
    spaceleft = _maxstorepathlen - len(res)
    if spaceleft > 0:
        filler = basename[:spaceleft]
        res = b'dh/' + dirs + filler + digest + ext
    return res
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: eliminate one level of lambda functions on _hybridencode
def _hybridencode(path, dotencode):
    """encodes path with a length limit

    Encodes all paths that begin with 'data/', according to the following.

    Default encoding (reversible):

    Encodes all uppercase letters 'X' as '_x'. All reserved or illegal
    characters are encoded as '~xx', where xx is the two digit hex code
    of the character (see encodefilename).
    Relevant path components consisting of Windows reserved filenames are
    masked by encoding the third character ('aux' -> 'au~78', see _auxencode).

    Hashed encoding (not reversible):

    If the default-encoded path is longer than _maxstorepathlen, a
    non-reversible hybrid hashing of the path is done instead.
    This encoding uses up to _dirprefixlen characters of all directory
    levels of the lowerencoded path, but not more levels than can fit into
    _maxshortdirslen.
    Then follows the filler followed by the sha digest of the full path.
    The filler is the beginning of the basename of the lowerencoded path
    (the basename is everything after the last path separator). The filler
    is as long as possible, filling in characters from the basename until
    the encoded path has _maxstorepathlen characters (or all chars of the
    basename have been taken).
    The extension (e.g. '.i' or '.d') is preserved.

    The string 'data/' at the beginning is replaced with 'dh/', if the hashed
    encoding was used.
    """
    path = encodedir(path)
    ef = _encodefname(path).split(b'/')
    res = b'/'.join(_auxencode(ef, dotencode))
    if len(res) > _maxstorepathlen:
        res = _hashencode(path, dotencode)
    return res
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: add a fallback _pathencode Python function...
def _pathencode(path):
    """encode ``path`` for the store, with dot-encoding enabled

    Uses the reversible encoding when the result fits in
    ``_maxstorepathlen`` and the hashed encoding (``_hashencode``)
    otherwise.
    """
    de = encodedir(path)
    if len(path) > _maxstorepathlen:
        # the unencoded path is already too long: skip the default encoding
        return _hashencode(de, True)
    ef = _encodefname(de).split(b'/')
    res = b'/'.join(_auxencode(ef, True))
    if len(res) > _maxstorepathlen:
        return _hashencode(de, True)
    return res
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: add a fallback _pathencode Python function...
r17624 _pathencode = getattr(parsers, 'pathencode', _pathencode)
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
store: move _plainhybridencode and _dothybridencode higher up in the file...
def _plainhybridencode(f):
    """``_hybridencode`` with dotencode disabled"""
    return _hybridencode(f, False)
Augie Fackler
formatting: blacken the codebase...
r43346
FUJIWARA Katsunori
store: invoke "os.stat()" for "createmode" initialization via vfs...
def _calcmode(vfs):
    """return the mode to create store files with, or None

    The mode is taken from ``vfs.stat()``.  None is returned when the stat
    call raises OSError, or when the permission bits already match what the
    current umask would produce.
    """
    try:
        # files in .hg/ will be created using this mode
        mode = vfs.stat().st_mode
        # avoid some useless chmods
        if (0o777 & ~util.umask) == (0o777 & mode):
            mode = None
    except OSError:
        mode = None
    return mode
Augie Fackler
formatting: blacken the codebase...
r43346
Pulkit Goyal
store: refactor space delimited list to proper data structure...
_data = [
    b'bookmarks',
    b'narrowspec',
    b'data',
    b'meta',
    b'00manifest.d',
    b'00manifest.i',
    b'00changelog.d',
    b'00changelog.i',
    b'phaseroots',
    b'obsstore',
    b'requires',
]

REVLOG_FILES_EXT = (
    b'.i',
    b'.idx',
    b'.d',
    b'.dat',
    b'.n',
    b'.nd',
    b'.sda',
)
# file extensions that also use a `-SOMELONGIDHASH.ext` form
REVLOG_FILES_LONG_EXT = (
    b'.nd',
    b'.idx',
    b'.dat',
    b'.sda',
)
# files that are "volatile" and might change between listing and streaming
#
# note: the ".nd" files are nodemap data and won't "change" but they might be
# deleted.
REVLOG_FILES_VOLATILE_EXT = (b'.n', b'.nd')

# some exceptions to the above matching
#
# XXX This is currently not in use because of issue6542
EXCLUDED = re.compile(br'.*undo\.[^/]+\.(nd?|i)$')
store: exclude `undo.` nodemap's file from `walk`...
r47752
store: also return some information about the type of file `walk` found...
r47657
def is_revlog(f, kind, st):
    """tell whether ``f`` is a regular file with a revlog extension

    ``kind`` is compared against ``stat.S_IFREG``; ``st`` is accepted but
    not used.
    """
    return kind == stat.S_IFREG and f.endswith(REVLOG_FILES_EXT)
store: also return some information about the type of file `walk` found...
r47657
store: stop relying on a `revlog_type` property...
def is_revlog_file(f):
    """tell whether the name ``f`` ends with one of REVLOG_FILES_EXT"""
    return f.endswith(REVLOG_FILES_EXT)
store: use `endswith` to detect revlog extension...
r47112
Matt Mackall
clone: get a list of files to clone from store
r6903
store: declare a `files` method on BaseStoreEntry...
@attr.s(slots=True)
class StoreFile:
    """a file matching a store entry"""

    unencoded_path = attr.ib()
    # cached size; None until provided at construction or computed by
    # `file_size`
    _file_size = attr.ib(default=None)
    is_volatile = attr.ib(default=False)
    # Missing file can be safely ignored, used by "copy/hardlink" local clone
    # for cache file not covered by lock.
    optional = False

    def file_size(self, vfs):
        """return the size of the file, computing and caching it if needed

        When the size is not cached yet it is read with ``vfs.stat()``; a
        missing file counts as size 0.  Passing ``vfs=None`` is only valid
        once the size is already cached, otherwise ProgrammingError is
        raised.
        """
        if self._file_size is None:
            if vfs is None:
                msg = b"calling vfs-less file_size without prior call: %s"
                msg %= self.unencoded_path
                raise error.ProgrammingError(msg)
            try:
                self._file_size = vfs.stat(self.unencoded_path).st_size
            except FileNotFoundError:
                self._file_size = 0
        return self._file_size

    @property
    def has_size(self):
        """True if the size of the file is already cached"""
        return self._file_size is not None

    def get_stream(self, vfs, volatiles):
        """return data "stream" information for this file

        (unencoded_file_path, content_iterator, content_size)

        The size must already be cached (see `file_size`).  The file is
        opened through ``volatiles.open()`` before this method returns.
        """
        size = self.file_size(None)

        def get_stream():
            path = vfs.join(self.unencoded_path)
            with volatiles.open(path) as fp:
                yield None  # ready to stream
                if size <= 65536:
                    yield fp.read(size)
                else:
                    yield from util.filechunkiter(fp, limit=size)

        s = get_stream()
        # run the generator up to its first yield so the file is opened now
        next(s)
        return (self.unencoded_path, s, size)
store: declare a `files` method on BaseStoreEntry...
r51531
store: have custom init for entries class...
@attr.s(slots=True, init=False)
class BaseStoreEntry:
    """An entry in the store

    This is returned by `store.walk` and represents some data in the store.
    """

    # subclasses set this to False when none of their files is volatile, it
    # lets `preserve_volatiles` skip listing the files.
    maybe_volatile = True

    def files(self) -> List[StoreFile]:
        """return the StoreFile objects of this entry (subclass duty)"""
        raise NotImplementedError

    def get_streams(
        self,
        repo=None,
        vfs=None,
        volatiles=None,
        max_changeset=None,
        preserve_file_count=False,
    ):
        """return a list of data streams associated to files for this entry

        return [(unencoded_file_path, content_iterator, content_size), ...]

        Only `vfs` and `volatiles` are used by this generic implementation,
        the other arguments are part of the signature shared with
        subclasses.
        """
        assert vfs is not None
        streams = []
        for store_file in self.files():
            streams.append(store_file.get_stream(vfs, volatiles))
        return streams

    def preserve_volatiles(self, vfs, volatiles):
        """Use a VolatileManager to preserve the state of any volatile file

        This is useful for code that needs a consistent view of the content,
        like stream clone.
        """
        if not self.maybe_volatile:
            return
        for store_file in self.files():
            if store_file.is_volatile:
                volatiles(vfs.join(store_file.unencoded_path))
store: issue a single entry for each revlog...
r51389
@attr.s(slots=True, init=False)
class SimpleStoreEntry(BaseStoreEntry):
    """A generic entry in the store, backed by a single file"""

    is_revlog = False

    maybe_volatile = attr.ib()
    _entry_path = attr.ib()
    _is_volatile = attr.ib(default=False)
    _file_size = attr.ib(default=None)
    _files = attr.ib(default=None)

    def __init__(
        self,
        entry_path,
        is_volatile=False,
        file_size=None,
    ):
        super().__init__()
        self._entry_path = entry_path
        self._file_size = file_size
        # the entry has a single file, so it may be volatile exactly when
        # that file is.
        self._is_volatile = is_volatile
        self.maybe_volatile = is_volatile
        # filled on the first call to `files()`
        self._files = None

    def files(self) -> List[StoreFile]:
        """return the (cached) one-item list of files for this entry"""
        if self._files is not None:
            return self._files
        only_file = StoreFile(
            unencoded_path=self._entry_path,
            file_size=self._file_size,
            is_volatile=self._is_volatile,
        )
        self._files = [only_file]
        return self._files
store: introduce a EntryFile object to actually access file info...
r51365
store: have custom init for entries class...
@attr.s(slots=True, init=False)
class RevlogStoreEntry(BaseStoreEntry):
    """A revlog entry in the store

    A single entry gathers all the files sharing the same path prefix.
    `details` maps each file suffix to the value handed to StoreFile as the
    file size.
    """

    is_revlog = True

    revlog_type = attr.ib(default=None)
    target_id = attr.ib(default=None)
    maybe_volatile = attr.ib(default=True)
    _path_prefix = attr.ib(default=None)
    _details = attr.ib(default=None)
    _files = attr.ib(default=None)

    def __init__(
        self,
        revlog_type,
        path_prefix,
        target_id,
        details,
    ):
        super().__init__()
        self.revlog_type = revlog_type
        self.target_id = target_id
        self._path_prefix = path_prefix
        # a revlog always has a main `.i` file
        assert b'.i' in details, (path_prefix, details)
        self.maybe_volatile = any(
            ext.endswith(REVLOG_FILES_VOLATILE_EXT) for ext in details
        )
        self._details = details
        # filled on the first call to `files()`
        self._files = None

    @property
    def is_changelog(self):
        """True when this entry is of the KIND_CHANGELOG type"""
        return self.revlog_type == KIND_CHANGELOG

    @property
    def is_manifestlog(self):
        """True when this entry is of the KIND_MANIFESTLOG type"""
        return self.revlog_type == KIND_MANIFESTLOG

    @property
    def is_filelog(self):
        """True when this entry is of the KIND_FILELOG type"""
        return self.revlog_type == KIND_FILELOG

    def main_file_path(self):
        """unencoded path of the main revlog file"""
        return self._path_prefix + b'.i'

    def files(self) -> List[StoreFile]:
        """return the (cached) list of files of this revlog

        Files are ordered with `_ext_key`, which puts the `.i` file last.
        """
        if self._files is None:
            # files that are "volatile" and might change between
            # listing and streaming
            #
            # note: the ".nd" files are nodemap data and won't "change"
            # but they might be deleted.
            self._files = [
                StoreFile(
                    self._path_prefix + ext,
                    self._details[ext],
                    ext.endswith(REVLOG_FILES_VOLATILE_EXT),
                )
                for ext in sorted(self._details, key=_ext_key)
            ]
        return self._files

    def get_streams(
        self,
        repo=None,
        vfs=None,
        volatiles=None,
        max_changeset=None,
        preserve_file_count=False,
    ):
        """return a list of data streams associated to files for this revlog

        Same return shape as `BaseStoreEntry.get_streams`. Three strategies
        are used:

        - every file has a known size and no special care is needed: plain
          file streaming from the parent class,
        - `preserve_file_count` is false: the `.i`/`.d` content is provided
          by the revlog object itself,
        - otherwise: as many streams as there are files must be produced,
          the index is streamed directly or through the revlog with
          `force_inline=True` depending on its header.
        """
        every_size_known = all(f.has_size for f in self.files())
        if every_size_known and (
            repo is None
            or max_changeset is None
            # This use revlog-v2, ignore for now
            or any(k.endswith(b'.idx') for k in self._details.keys())
            # This is not inline, no race expected
            or b'.d' in self._details
        ):
            return super().get_streams(
                repo=repo,
                vfs=vfs,
                volatiles=volatiles,
                max_changeset=max_changeset,
                preserve_file_count=preserve_file_count,
            )
        elif not preserve_file_count:
            # side files are streamed as plain files, the revlog provides
            # the index and data content.
            stream = [
                f.get_stream(vfs, volatiles)
                for f in self.files()
                if not f.unencoded_path.endswith((b'.i', b'.d'))
            ]
            rl = self.get_revlog_instance(repo).get_revlog()
            stream.extend(rl.get_streams(max_changeset))
            return stream

        name_to_size = {
            f.unencoded_path: f.file_size(None) for f in self.files()
        }

        stream = [
            f.get_stream(vfs, volatiles)
            for f in self.files()
            if not f.unencoded_path.endswith(b'.i')
        ]
        index_path = self._path_prefix + b'.i'

        # `index_file` is reset to None once a stream took ownership of the
        # file object, so that the `finally` clause does not close it.
        index_file = None
        try:
            index_file = vfs(index_path)
            header = index_file.read(INDEX_HEADER.size)
            if revlogmod.revlog.is_inline_index(header):
                size = name_to_size[index_path]

                # no split underneath, just return the stream
                def get_stream():
                    fp = index_file
                    try:
                        fp.seek(0)
                        yield None
                        if size <= 65536:
                            yield fp.read(size)
                        else:
                            yield from util.filechunkiter(fp, limit=size)
                    finally:
                        fp.close()

                s = get_stream()
                # run up to the first yield: the generator now holds the
                # file object and is responsible for closing it.
                next(s)
                index_file = None
                stream.append((index_path, s, size))
            else:
                rl = self.get_revlog_instance(repo).get_revlog()
                rl_stream = rl.get_streams(max_changeset, force_inline=True)
                for name, _content, provided in rl_stream:
                    expected = name_to_size.get(name, 0)
                    if expected != provided:
                        msg = _(b"expected %d bytes but %d provided for %s")
                        msg %= expected, provided, name
                        raise error.Abort(msg)
                stream.extend(rl_stream)
        finally:
            if index_file is not None:
                index_file.close()

        files = self.files()
        assert len(stream) == len(files), (
            stream,
            files,
            self._path_prefix,
            self.target_id,
        )
        return stream

    def get_revlog_instance(self, repo):
        """Obtain a revlog instance from this store entry

        An instance of the appropriate class is returned.
        """
        if self.is_changelog:
            return changelog.changelog(repo.svfs)
        if self.is_manifestlog:
            return manifest.manifestrevlog(
                repo.nodeconstants, repo.svfs, tree=self.target_id
            )
        return filelog.filelog(repo.svfs, self.target_id)
store: use specialized class for store entries...
r51366
store: add logic to group revlog file together...
def _gather_revlog(files_data):
    """group files per revlog prefix

    `files_data` is an iterable of `(filename, value)` pairs.

    This returns a list of `(prefix, suffixes)` pairs sorted by prefix. The
    prefix is the revlog path without extension, and `suffixes` is a dict
    mapping each file "suffix" seen for this revlog to the arbitrary value
    that came with the file.
    """
    grouped = {}
    for filename, value in files_data:
        prefix, suffix = _split_revlog_ext(filename)
        grouped.setdefault(prefix, {})[suffix] = value
    return sorted(grouped.items())
def _split_revlog_ext(filename):
    """split the revlog file prefix from the variable extension

    Returns a `(prefix, suffix)` pair such that `prefix + suffix` is
    `filename`.

    Files ending with one of REVLOG_FILES_LONG_EXT use a
    `-SOMELONGIDHASH.ext` form, for them the suffix starts at the last `-`
    of the last path component. Every other file is split at its last `.`.

    A long-extension name without any `-` in its last path component falls
    back to the `.` split, and a name without any separator is returned
    whole with an empty suffix.
    """
    idx = -1
    if filename.endswith(REVLOG_FILES_LONG_EXT):
        # only search the last path component: a `-` in a directory name is
        # not an extension separator.
        basename_start = filename.rfind(b'/') + 1
        idx = filename.rfind(b'-', basename_start)
    if idx < 0:
        idx = filename.rfind(b'.')
    if idx < 0:
        # nothing to split on, `rfind` returned -1 and slicing with it would
        # cut the last character off.
        return filename, b''
    return filename[:idx], filename[idx:]
store: also gather files per revlog in `topfiles`...
r51374 def _ext_key(ext):
"""a key to order revlog suffix
important to issue .i after other entry."""
# the only important part of this order is to keep the `.i` last.
if ext.endswith(b'.n'):
return (0, ext)
elif ext.endswith(b'.nd'):
return (10, ext)
elif ext.endswith(b'.d'):
return (20, ext)
elif ext.endswith(b'.i'):
return (50, ext)
else:
return (40, ext)
Gregory Szorc
py3: use class X: instead of class X(object):...
class basicstore:
    '''base class for local repository stores'''

    def __init__(self, path, vfstype):
        vfs = vfstype(path)
        self.path = vfs.base
        self.createmode = _calcmode(vfs)
        vfs.createmode = self.createmode
        # unfiltered access, used for directory listing
        self.rawvfs = vfs
        self.vfs = vfsmod.filtervfs(vfs, encodedir)
        self.opener = self.vfs

    def join(self, f):
        """return the store path for `f`, passed through `encodedir`"""
        return self.path + b'/' + encodedir(f)

    def _walk(self, relpath, recurse, undecodable=None):
        """return a sorted list of `(unencoded_path, size)` for revlog files

        The listing starts at `relpath` (relative to the store), and only
        goes into sub-directories when `recurse` is true. An empty list is
        returned when the starting point is not a directory.

        `undecodable` is not used by this implementation.
        """
        root = self.path
        start = root + b'/' + relpath if relpath else root
        # paths are reported relative to the store root
        striplen = len(root) + 1
        found = []
        if self.rawvfs.isdir(start):
            readdir = self.rawvfs.readdir
            pending = [start]
            while pending:
                current = pending.pop()
                for name, kind, st in readdir(current, stat=True):
                    full = current + b'/' + name
                    if is_revlog(name, kind, st):
                        rel = util.pconvert(full[striplen:])
                        found.append((decodedir(rel), st.st_size))
                    elif kind == stat.S_IFDIR and recurse:
                        pending.append(full)

        found.sort()
        return found

    def changelog(self, trypending, concurrencychecker=None):
        """return a changelog object reading through this store vfs"""
        return changelog.changelog(
            self.vfs,
            trypending=trypending,
            concurrencychecker=concurrencychecker,
        )

    def manifestlog(self, repo, storenarrowmatch) -> manifest.manifestlog:
        """return a manifestlog object reading through this store vfs"""
        rootstore = manifest.manifestrevlog(repo.nodeconstants, self.vfs)
        return manifest.manifestlog(self.vfs, repo, rootstore, storenarrowmatch)

    def data_entries(
        self, matcher=None, undecodable=None
    ) -> Generator[BaseStoreEntry, None, None]:
        """Like walk, but excluding the changelog and root manifest.

        When [undecodable] is None, revlogs names that can't be
        decoded cause an exception. When it is provided, it should
        be a list and the filenames that can't be decoded are added
        to it instead. This is very rarely needed.

        Note that `matcher` is not used by this implementation."""
        # (directory, revlog type, whether the target id is a directory)
        dirs = [
            (b'data', KIND_FILELOG, False),
            (b'meta', KIND_MANIFESTLOG, True),
        ]
        for base_dir, rl_type, strip_filename in dirs:
            files = self._walk(base_dir, True, undecodable=undecodable)
            for revlog, details in _gather_revlog(files):
                # drop the leading `data/` or `meta/`
                target = revlog.split(b'/', 1)[1]
                if strip_filename and b'/' in revlog:
                    # keep the directory part only, with its final `/`
                    target = target.rsplit(b'/', 1)[0] + b'/'
                yield RevlogStoreEntry(
                    path_prefix=revlog,
                    revlog_type=rl_type,
                    target_id=target,
                    details=details,
                )

    def top_entries(
        self, phase=False, obsolescence=False
    ) -> Generator[BaseStoreEntry, None, None]:
        """yield entries for the files at the top level of the store

        `phaseroots` and `obsstore` are only issued when requested through
        `phase` and `obsolescence` and when they exist. They come first,
        followed by the other top level files, then the manifest and finally
        the changelog.
        """
        if phase and self.vfs.exists(b'phaseroots'):
            yield SimpleStoreEntry(
                entry_path=b'phaseroots',
                is_volatile=True,
            )

        if obsolescence and self.vfs.exists(b'obsstore'):
            # XXX if we had the file size it could be non-volatile
            yield SimpleStoreEntry(
                entry_path=b'obsstore',
                is_volatile=True,
            )

        changelogs = collections.defaultdict(dict)
        manifestlogs = collections.defaultdict(dict)

        for u, s in reversed(self._walk(b'', False)):
            if u.startswith(b'00changelog'):
                bucket = changelogs
            elif u.startswith(b'00manifest'):
                bucket = manifestlogs
            else:
                yield SimpleStoreEntry(
                    entry_path=u,
                    is_volatile=False,
                    file_size=s,
                )
                continue
            name, ext = _split_revlog_ext(u)
            bucket[name][ext] = s

        # yield manifest before changelog
        top_rl = [
            (manifestlogs, KIND_MANIFESTLOG),
            (changelogs, KIND_CHANGELOG),
        ]
        assert len(manifestlogs) <= 1
        assert len(changelogs) <= 1
        for data, revlog_type in top_rl:
            for revlog, details in sorted(data.items()):
                yield RevlogStoreEntry(
                    path_prefix=revlog,
                    revlog_type=revlog_type,
                    target_id=b'',
                    details=details,
                )

    def walk(
        self, matcher=None, phase=False, obsolescence=False
    ) -> Generator[BaseStoreEntry, None, None]:
        """return files related to data storage (ie: revlogs)

        yields instances of BaseStoreEntry subclasses

        if a matcher is passed, it is handed over to `data_entries` so that
        only the storage files of the tracked paths it matches are issued.
        """
        # yield data files first
        yield from self.data_entries(matcher)
        yield from self.top_entries(phase=phase, obsolescence=obsolescence)

    def copylist(self):
        """return the module level `_data` list"""
        return _data

    def write(self, tr):
        """nothing to write for this kind of store"""
        pass

    def invalidatecaches(self):
        """no cache to invalidate for this kind of store"""
        pass

    def markremoved(self, fn):
        """nothing to record for this kind of store"""
        pass

    def __contains__(self, path):
        '''Checks if the store contains path'''
        data_path = b"/".join((b"data", path))
        # file?
        if self.vfs.exists(data_path + b".i"):
            return True
        # dir?
        if not data_path.endswith(b"/"):
            data_path = data_path + b"/"
        return self.vfs.exists(data_path)
smuralid
store: add a contains method to basicstore...
r17744
Augie Fackler
formatting: blacken the codebase...
r43346
Matt Mackall
store: simplify class hierarchy
class encodedstore(basicstore):
    """store living in a `store/` sub-directory, using `encodefilename`"""

    def __init__(self, path, vfstype):
        vfs = vfstype(path + b'/store')
        self.path = vfs.base
        self.createmode = _calcmode(vfs)
        vfs.createmode = self.createmode
        # unfiltered access, used for directory listing
        self.rawvfs = vfs
        self.vfs = vfsmod.filtervfs(vfs, encodefilename)
        self.opener = self.vfs

    def _walk(self, relpath, recurse, undecodable=None):
        """same as `basicstore._walk`, with names run through
        `decodefilename`

        A name that cannot be decoded raises a StorageError, unless
        `undecodable` is a list: the name is then appended to it and
        skipped.
        """
        decoded = []
        for encoded_name, value in super()._walk(relpath, recurse):
            try:
                name = decodefilename(encoded_name)
            except KeyError:
                if undecodable is None:
                    msg = _(b'undecodable revlog name %s') % encoded_name
                    raise error.StorageError(msg)
                undecodable.append(encoded_name)
            else:
                decoded.append((name, value))
        return decoded

    def data_entries(
        self, matcher=None, undecodable=None
    ) -> Generator[BaseStoreEntry, None, None]:
        """same as `basicstore.data_entries`, keeping only the entries
        accepted by `_match_tracked_entry` for `matcher`"""
        for entry in super().data_entries(undecodable=undecodable):
            if _match_tracked_entry(entry, matcher):
                yield entry

    def join(self, f):
        """return the store path for `f`, passed through `encodefilename`"""
        return self.path + b'/' + encodefilename(f)

    def copylist(self):
        """return `requires`, `00changelog.i` and the `_data` names prefixed
        with `store/`"""
        top_level = [b'requires', b'00changelog.i']
        in_store = [b'store/' + f for f in _data]
        return top_level + in_store
Augie Fackler
formatting: blacken the codebase...
r43346
Matt Mackall
clone: get a list of files to clone from store
r6903
Gregory Szorc
py3: use class X: instead of class X(object):...
class fncache:
    """In-memory view of the store's ``fncache`` file.

    Attributes:

    - ``vfs``: callable used to open the ``fncache`` file.
    - ``entries``: set of names read from the file, or ``None`` while the
      file has not been loaded yet.
    - ``addls``: names added since the last write, not yet on disk.
    - ``_ignores``: names that ``add()`` silently skips.
    - ``_dirty``: True when an entry was removed, which forces ``write()``
      to rewrite the whole file instead of appending to it.
    """

    # the filename used to be partially encoded
    # hence the encodedir/decodedir dance
    def __init__(self, vfs):
        self.vfs = vfs
        self._ignores = set()
        self.entries = None
        self._dirty = False
        # set of new additions to fncache
        self.addls = set()

    @property
    def is_loaded(self):
        """True once the entries have been read (or initialised empty)."""
        return self.entries is not None

    def ensureloaded(self, warn=None):
        """read the fncache file if not already read.

        If the file on disk is corrupted, raise. If warn is provided,
        warn and keep going instead."""
        if not self.is_loaded:
            self._load(warn)

    def _load(self, warn=None):
        '''fill the entries from the fncache file

        ``warn``, when provided, is called with a message instead of
        raising ``error.Abort`` on a malformed file.
        '''
        self._dirty = False
        try:
            fp = self.vfs(b'fncache', mode=b'rb')
        except IOError:
            # skip nonexistent file
            self.entries = set()
            return

        # Always release the file handle, including when a malformed file
        # makes us raise below.
        try:
            self.entries = set()
            chunk = b''
            for c in iter(functools.partial(fp.read, fncache_chunksize), b''):
                chunk += c
                try:
                    p = chunk.rindex(b'\n')
                    self.entries.update(
                        decodedir(chunk[: p + 1]).splitlines()
                    )
                    chunk = chunk[p + 1 :]
                except ValueError:
                    # substring '\n' not found, maybe the entry is bigger
                    # than the chunksize, so let's keep iterating
                    pass

            if chunk:
                # leftover data means the last entry has no newline
                msg = _(b"fncache does not ends with a newline")
                if warn:
                    warn(msg + b'\n')
                else:
                    raise error.Abort(
                        msg,
                        hint=_(
                            b"use 'hg debugrebuildfncache' to "
                            b"rebuild the fncache"
                        ),
                    )
            self._checkentries(fp, warn)
        finally:
            fp.close()

    def _checkentries(self, fp, warn):
        """make sure there is no empty string in entries

        When an empty entry exists, ``fp`` is re-read from the start to
        report the offending line number(s), through ``warn`` if provided
        and by raising ``error.Abort`` otherwise.
        """
        if b'' in self.entries:
            fp.seek(0)
            for n, line in enumerate(fp):
                if not line.rstrip(b'\n'):
                    t = _(b'invalid entry in fncache, line %d') % (n + 1)
                    if warn:
                        warn(t + b'\n')
                    else:
                        raise error.Abort(t)

    def write(self, tr):
        """Flush pending changes to the ``fncache`` file.

        ``tr`` is asked to back up ``fncache`` before each modification.
        If an entry was removed the whole file is rewritten; if there are
        only additions they are appended.
        """
        if self._dirty:
            assert self.is_loaded
            self.entries = self.entries | self.addls
            self.addls = set()
            tr.addbackup(b'fncache')
            fp = self.vfs(b'fncache', mode=b'wb', atomictemp=True)
            if self.entries:
                fp.write(encodedir(b'\n'.join(self.entries) + b'\n'))
            fp.close()
            self._dirty = False
        if self.addls:
            # if we have just new entries, let's append them to the fncache
            tr.addbackup(b'fncache')
            fp = self.vfs(b'fncache', mode=b'ab', atomictemp=True)
            fp.write(encodedir(b'\n'.join(self.addls) + b'\n'))
            fp.close()
            # force a reload on next access
            self.entries = None
            self.addls = set()

    def addignore(self, fn):
        """Make later ``add(fn)`` calls a no-op."""
        self._ignores.add(fn)

    def add(self, fn):
        """Record ``fn`` as a pending addition unless ignored or known."""
        if fn in self._ignores:
            return
        if not self.is_loaded:
            self._load()
        if fn not in self.entries:
            self.addls.add(fn)

    def remove(self, fn):
        """Forget ``fn``; unknown names are silently accepted."""
        if not self.is_loaded:
            self._load()
        if fn in self.addls:
            # never reached the disk: dropping the pending addition is enough
            self.addls.remove(fn)
            return
        try:
            self.entries.remove(fn)
            self._dirty = True
        except KeyError:
            pass

    def __contains__(self, fn):
        # pending additions are checked first to avoid loading the file
        if fn in self.addls:
            return True
        if not self.is_loaded:
            self._load()
        return fn in self.entries

    def __iter__(self):
        if not self.is_loaded:
            self._load()
        return iter(self.entries | self.addls)
Adrian Buehlmann
introduce fncache repository layout...
r7229
Augie Fackler
formatting: blacken the codebase...
r43346
Boris Feld
vfs: fix proxyvfs inheritance...
class _fncachevfs(vfsmod.proxyvfs):
    """Proxy vfs that encodes paths and feeds written files to the fncache.

    ``fnc`` is the ``fncache`` instance to update and ``encode`` is the
    callable applied to every path before it reaches the wrapped vfs.
    """

    def __init__(self, vfs, fnc, encode):
        vfsmod.proxyvfs.__init__(self, vfs)
        self.fncache: fncache = fnc
        self.encode = encode
        self.uses_dotencode = encode is _pathencode

    def __call__(self, path, mode=b'r', *args, **kw):
        """Open ``path`` through the wrapped vfs using its encoded name.

        Non-read opens of revlog files under ``data/`` or ``meta/`` are
        registered in the fncache first.
        """
        encoded = self.encode(path)
        is_write = mode not in (b'r', b'rb')
        if (
            is_write
            and path.startswith((b'data/', b'meta/'))
            and is_revlog_file(path)
        ):
            # do not trigger a fncache load when adding a file that already
            # is known to exist.
            #
            # if the file has size zero, it should be considered as missing.
            # Such zero-size files are the result of truncation when a
            # transaction is aborted.
            if self.fncache.is_loaded or not (
                self.vfs.exists(encoded) and self.vfs.stat(encoded).st_size
            ):
                self.fncache.add(path)
        return self.vfs(encoded, mode, *args, **kw)

    def join(self, path: Optional[bytes], *insidef: bytes) -> bytes:
        """Join on the wrapped vfs after encoding every component.

        A falsy ``path`` is passed through unencoded.
        """
        encoded_rest = (self.encode(part) for part in insidef)
        if not path:
            return self.vfs.join(path, *encoded_rest)
        return self.vfs.join(self.encode(path), *encoded_rest)

    def register_file(self, path):
        """generic hook point to lets fncache steer its stew"""
        if path.startswith((b'data/', b'meta/')):
            self.fncache.add(path)
Augie Fackler
formatting: blacken the codebase...
r43346
Adrian Buehlmann
introduce fncache repository layout...
class fncachestore(basicstore):
    """Store whose revlog files are tracked through an ``fncache`` file."""

    def __init__(self, path, vfstype, dotencode):
        """Set up the raw and encoding vfs objects under ``path + b'/store'``.

        ``dotencode`` selects ``_pathencode`` over ``_plainhybridencode``
        as the path encoder.
        """
        self.encode = _pathencode if dotencode else _plainhybridencode
        rawvfs = vfstype(path + b'/store')
        self.path = rawvfs.base
        self.pathsep = self.path + b'/'
        self.createmode = _calcmode(rawvfs)
        rawvfs.createmode = self.createmode
        self.rawvfs = rawvfs
        self.fncache = fncache(rawvfs)
        self.vfs = _fncachevfs(rawvfs, self.fncache, self.encode)
        self.opener = self.vfs

    def join(self, f):
        """Return the store path joined with the encoded form of ``f``."""
        return self.pathsep + self.encode(f)

    def getsize(self, path):
        """Return the size reported by the raw vfs ``stat`` for ``path``."""
        return self.rawvfs.stat(path).st_size

    def data_entries(
        self, matcher=None, undecodable=None
    ) -> Generator[BaseStoreEntry, None, None]:
        """Yield one ``RevlogStoreEntry`` per revlog listed in the fncache.

        Only entries accepted by ``_match_tracked_entry(entry, matcher)``
        are yielded. ``undecodable`` is accepted but not used here.
        """
        # Note: all files in fncache should be revlog related, However the
        # fncache might contains such file added by previous version of
        # Mercurial.
        candidates = ((f, None) for f in self.fncache if is_revlog_file(f))
        for prefix, details in _gather_revlog(candidates):
            if prefix.startswith(b'data/'):
                rl_type = KIND_FILELOG
                target_id = prefix.split(b'/', 1)[1]
            elif prefix.startswith(b'meta/'):
                rl_type = KIND_MANIFESTLOG
                # drop the initial directory and the `00manifest` file part
                inner = prefix.split(b'/', 1)[1]
                target_id = inner.rsplit(b'/', 1)[0] + b'/'
            else:
                # unreachable
                assert False, prefix
            entry = RevlogStoreEntry(
                path_prefix=prefix,
                revlog_type=rl_type,
                target_id=target_id,
                details=details,
            )
            if _match_tracked_entry(entry, matcher):
                yield entry

    def copylist(self):
        """Return the list of files to copy when cloning from this store."""
        store_names = (
            b'bookmarks',
            b'narrowspec',
            b'data',
            b'meta',
            b'dh',
            b'fncache',
            b'phaseroots',
            b'obsstore',
            b'00manifest.d',
            b'00manifest.i',
            b'00changelog.d',
            b'00changelog.i',
            b'requires',
        )
        top_level = [b'requires', b'00changelog.i']
        return top_level + [b'store/' + name for name in store_names]

    def write(self, tr):
        """Delegate to the fncache's ``write`` with transaction ``tr``."""
        self.fncache.write(tr)

    def invalidatecaches(self):
        """Drop the loaded fncache entries and any pending additions."""
        self.fncache.entries = None
        self.fncache.addls = set()

    def markremoved(self, fn):
        """Remove ``fn`` from the fncache."""
        self.fncache.remove(fn)

    def _exists(self, f):
        """Return True if the encoded form of ``f`` can be stat'ed."""
        encoded = self.encode(f)
        try:
            self.getsize(encoded)
        except FileNotFoundError:
            return False
        else:
            return True

    def __contains__(self, path):
        '''Checks if the store contains path'''
        path = b"/".join((b"data", path))
        # check for files (exact match)
        index = path + b'.i'
        if index in self.fncache and self._exists(index):
            return True
        # now check for directories (prefix match)
        prefix = path if path.endswith(b'/') else path + b'/'
        return any(
            e.startswith(prefix) and self._exists(e) for e in self.fncache
        )