upstream/mercurial-mirror Commit - r51531:8fc10bfd

1

# store.py - repository store handling for Mercurial

1

# store.py - repository store handling for Mercurial

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

import collections

8

import collections

9

import functools

9

import functools

10

import os

10

import os

11

import re

11

import re

12

import stat

12

import stat

13

from typing import Generator

13

from typing import Generator, List

14

15

from .i18n import _

15

from .i18n import _

16

from .pycompat import getattr

16

from .pycompat import getattr

17

from .thirdparty import attr

17

from .thirdparty import attr

18

from .node import hex

18

from .node import hex

19

from . import (

19

from . import (

20

changelog,

20

changelog,

21

error,

21

error,

22

filelog,

22

filelog,

23

manifest,

23

manifest,

24

policy,

24

policy,

25

pycompat,

25

pycompat,

26

util,

26

util,

27

vfs as vfsmod,

27

vfs as vfsmod,

28

)

28

)

29

from .utils import hashutil

29

from .utils import hashutil

30

31

# Module object returned by policy.importmod() for 'parsers'; the encoders
# below probe it with getattr() and fall back to the Python versions.
parsers = policy.importmod('parsers')
# how many bytes should be read from fncache in one read
# It is done to prevent loading large fncache files into memory
fncache_chunksize = 10 ** 6

35

36

37

def _match_tracked_entry(entry, matcher):

37

def _match_tracked_entry(entry, matcher):

38

"""parses a fncache entry and returns whether the entry is tracking a path

38

"""parses a fncache entry and returns whether the entry is tracking a path

39

matched by matcher or not.

39

matched by matcher or not.

40

41

If matcher is None, returns True"""

41

If matcher is None, returns True"""

42

43

if matcher is None:

43

if matcher is None:

44

return True

44

return True

45

if entry.is_filelog:

45

if entry.is_filelog:

46

return matcher(entry.target_id)

46

return matcher(entry.target_id)

47

elif entry.is_manifestlog:

47

elif entry.is_manifestlog:

48

return matcher.visitdir(entry.target_id.rstrip(b'/'))

48

return matcher.visitdir(entry.target_id.rstrip(b'/'))

49

raise error.ProgrammingError(b"cannot process entry %r" % entry)

49

raise error.ProgrammingError(b"cannot process entry %r" % entry)

50

51

52

# This avoids a collision between a file named foo and a dir named

52

# This avoids a collision between a file named foo and a dir named

53

# foo.i or foo.d

53

# foo.i or foo.d

54

def _encodedir(path):

54

def _encodedir(path):

55

"""

55

"""

56

>>> _encodedir(b'data/foo.i')

56

>>> _encodedir(b'data/foo.i')

57

'data/foo.i'

57

'data/foo.i'

58

>>> _encodedir(b'data/foo.i/bla.i')

58

>>> _encodedir(b'data/foo.i/bla.i')

59

'data/foo.i.hg/bla.i'

59

'data/foo.i.hg/bla.i'

60

>>> _encodedir(b'data/foo.i.hg/bla.i')

60

>>> _encodedir(b'data/foo.i.hg/bla.i')

61

'data/foo.i.hg.hg/bla.i'

61

'data/foo.i.hg.hg/bla.i'

62

>>> _encodedir(b'data/foo.i\\ndata/foo.i/bla.i\\ndata/foo.i.hg/bla.i\\n')

62

>>> _encodedir(b'data/foo.i\\ndata/foo.i/bla.i\\ndata/foo.i.hg/bla.i\\n')

63

'data/foo.i\\ndata/foo.i.hg/bla.i\\ndata/foo.i.hg.hg/bla.i\\n'

63

'data/foo.i\\ndata/foo.i.hg/bla.i\\ndata/foo.i.hg.hg/bla.i\\n'

64

"""

64

"""

65

return (

65

return (

66

path.replace(b".hg/", b".hg.hg/")

66

path.replace(b".hg/", b".hg.hg/")

67

.replace(b".i/", b".i.hg/")

67

.replace(b".i/", b".i.hg/")

68

.replace(b".d/", b".d.hg/")

68

.replace(b".d/", b".d.hg/")

69

)

69

)

70

71

72

# Use parsers.encodedir when the loaded parsers module provides one,
# otherwise fall back to the Python implementation above.
encodedir = getattr(parsers, 'encodedir', _encodedir)

73

74

75

def decodedir(path):
    """Strip the ``.hg`` suffix from ``.d.hg/``, ``.i.hg/`` and ``.hg.hg/``
    directory components.

    >>> decodedir(b'data/foo.i')
    'data/foo.i'
    >>> decodedir(b'data/foo.i.hg/bla.i')
    'data/foo.i/bla.i'
    >>> decodedir(b'data/foo.i.hg.hg/bla.i')
    'data/foo.i.hg/bla.i'
    """
    # Fast path: without '.hg/' none of the replacements below can match.
    if b".hg/" not in path:
        return path
    return (
        path.replace(b".d.hg/", b".d/")
        .replace(b".i.hg/", b".i/")
        .replace(b".hg.hg/", b".hg/")
    )

91

92

93

def _reserved():

93

def _reserved():

94

"""characters that are problematic for filesystems

94

"""characters that are problematic for filesystems

95

96

* ascii escapes (0..31)

96

* ascii escapes (0..31)

97

* ascii hi (126..255)

97

* ascii hi (126..255)

98

* windows specials

98

* windows specials

99

100

these characters will be escaped by encodefunctions

100

these characters will be escaped by encodefunctions

101

"""

101

"""

102

winreserved = [ord(x) for x in u'\\:*?"<>|']

102

winreserved = [ord(x) for x in u'\\:*?"<>|']

103

for x in range(32):

103

for x in range(32):

104

yield x

104

yield x

105

for x in range(126, 256):

105

for x in range(126, 256):

106

yield x

106

yield x

107

for x in winreserved:

107

for x in winreserved:

108

yield x

108

yield x

109

110

111

def _buildencodefun():
    """Build the reversible filename encoder and its decoder.

    Returns an ``(encode, decode)`` pair of functions operating on bytes.

    >>> enc, dec = _buildencodefun()

    >>> enc(b'nothing/special.txt')
    'nothing/special.txt'
    >>> dec(b'nothing/special.txt')
    'nothing/special.txt'

    >>> enc(b'HELLO')
    '_h_e_l_l_o'
    >>> dec(b'_h_e_l_l_o')
    'HELLO'

    >>> enc(b'hello:world?')
    'hello~3aworld~3f'
    >>> dec(b'hello~3aworld~3f')
    'hello:world?'

    >>> enc(b'the\\x07quick\\xADshot')
    'the~07quick~adshot'
    >>> dec(b'the~07quick~adshot')
    'the\\x07quick\\xadshot'
    """
    e = b'_'
    xchr = pycompat.bytechr
    asciistr = list(map(xchr, range(127)))
    capitals = list(range(ord(b"A"), ord(b"Z") + 1))

    # Start from the identity mapping, then override reserved characters
    # ('~xx') and finally capitals and the escape character itself ('_x').
    cmap = {x: x for x in asciistr}
    for x in _reserved():
        cmap[xchr(x)] = b"~%02x" % x
    for x in capitals + [ord(e)]:
        cmap[xchr(x)] = e + xchr(x).lower()

    # Reverse table: encoded token -> original byte.
    dmap = {}
    for k, v in cmap.items():
        dmap[v] = k

    def decode(s):
        i = 0
        while i < len(s):
            # Encoded tokens are 1 to 3 bytes long; try the shortest first.
            for l in range(1, 4):
                try:
                    yield dmap[s[i : i + l]]
                    i += l
                    break
                except KeyError:
                    pass
            else:
                # No token of any length matched at this position.
                raise KeyError

    return (
        lambda s: b''.join([cmap[s[c : c + 1]] for c in range(len(s))]),
        lambda s: b''.join(list(decode(s))),
    )

167

168

169

# Build the encode/decode pair once at import time.
_encodefname, _decodefname = _buildencodefun()

170

171

172

def encodefilename(s):
    """Apply the directory encoding, then the per-character encoding.

    >>> encodefilename(b'foo.i/bar.d/bla.hg/hi:world?/HELLO')
    'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o'
    """
    return _encodefname(encodedir(s))

178

179

180

def decodefilename(s):
    """Undo the per-character encoding, then the directory encoding.

    >>> decodefilename(b'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o')
    'foo.i/bar.d/bla.hg/hi:world?/HELLO'
    """
    return decodedir(_decodefname(s))

186

187

188

def _buildlowerencodefun():
    """Build an encoder that lowercases capitals and escapes reserved bytes.

    >>> f = _buildlowerencodefun()
    >>> f(b'nothing/special.txt')
    'nothing/special.txt'
    >>> f(b'HELLO')
    'hello'
    >>> f(b'hello:world?')
    'hello~3aworld~3f'
    >>> f(b'the\\x07quick\\xADshot')
    'the~07quick~adshot'
    """
    xchr = pycompat.bytechr
    # Identity mapping first, then reserved characters become '~xx' and
    # capitals map to their lowercase form.
    cmap = {xchr(x): xchr(x) for x in range(127)}
    for x in _reserved():
        cmap[xchr(x)] = b"~%02x" % x
    for x in range(ord(b"A"), ord(b"Z") + 1):
        cmap[xchr(x)] = xchr(x).lower()

    def lowerencode(s):
        return b"".join([cmap[c] for c in pycompat.iterbytestr(s)])

    return lowerencode

211

212

213

# Use parsers.lowerencode when it exists and is truthy; otherwise build the
# Python implementation.
lowerencode = getattr(parsers, 'lowerencode', None) or _buildlowerencodefun()

214

215

# Windows reserved names: con, prn, aux, nul, com1..com9, lpt1..lpt9

215

# Windows reserved names: con, prn, aux, nul, com1..com9, lpt1..lpt9

216

_winres3 = (b'aux', b'con', b'prn', b'nul') # length 3

216

_winres3 = (b'aux', b'con', b'prn', b'nul') # length 3

217

_winres4 = (b'com', b'lpt') # length 4 (with trailing 1..9)

217

_winres4 = (b'com', b'lpt') # length 4 (with trailing 1..9)

218

219

220

def _auxencode(path, dotencode):

220

def _auxencode(path, dotencode):

221

"""

221

"""

222

Encodes filenames containing names reserved by Windows or which end in

222

Encodes filenames containing names reserved by Windows or which end in

223

period or space. Does not touch other single reserved characters c.

223

period or space. Does not touch other single reserved characters c.

224

Specifically, c in '\\:*?"<>|' or ord(c) <= 31 are *not* encoded here.

224

Specifically, c in '\\:*?"<>|' or ord(c) <= 31 are *not* encoded here.

225

Additionally encodes space or period at the beginning, if dotencode is

225

Additionally encodes space or period at the beginning, if dotencode is

226

True. Parameter path is assumed to be all lowercase.

226

True. Parameter path is assumed to be all lowercase.

227

A segment only needs encoding if a reserved name appears as a

227

A segment only needs encoding if a reserved name appears as a

228

basename (e.g. "aux", "aux.foo"). A directory or file named "foo.aux"

228

basename (e.g. "aux", "aux.foo"). A directory or file named "foo.aux"

229

doesn't need encoding.

229

doesn't need encoding.

230

231

>>> s = b'.foo/aux.txt/txt.aux/con/prn/nul/foo.'

231

>>> s = b'.foo/aux.txt/txt.aux/con/prn/nul/foo.'

232

>>> _auxencode(s.split(b'/'), True)

232

>>> _auxencode(s.split(b'/'), True)

233

['~2efoo', 'au~78.txt', 'txt.aux', 'co~6e', 'pr~6e', 'nu~6c', 'foo~2e']

233

['~2efoo', 'au~78.txt', 'txt.aux', 'co~6e', 'pr~6e', 'nu~6c', 'foo~2e']

234

>>> s = b'.com1com2/lpt9.lpt4.lpt1/conprn/com0/lpt0/foo.'

234

>>> s = b'.com1com2/lpt9.lpt4.lpt1/conprn/com0/lpt0/foo.'

235

>>> _auxencode(s.split(b'/'), False)

235

>>> _auxencode(s.split(b'/'), False)

236

['.com1com2', 'lp~749.lpt4.lpt1', 'conprn', 'com0', 'lpt0', 'foo~2e']

236

['.com1com2', 'lp~749.lpt4.lpt1', 'conprn', 'com0', 'lpt0', 'foo~2e']

237

>>> _auxencode([b'foo. '], True)

237

>>> _auxencode([b'foo. '], True)

238

['foo.~20']

238

['foo.~20']

239

>>> _auxencode([b' .foo'], True)

239

>>> _auxencode([b' .foo'], True)

240

['~20.foo']

240

['~20.foo']

241

"""

241

"""

242

for i, n in enumerate(path):

242

for i, n in enumerate(path):

243

if not n:

243

if not n:

244

continue

244

continue

245

if dotencode and n[0] in b'. ':

245

if dotencode and n[0] in b'. ':

246

n = b"~%02x" % ord(n[0:1]) + n[1:]

246

n = b"~%02x" % ord(n[0:1]) + n[1:]

247

path[i] = n

247

path[i] = n

248

else:

248

else:

249

l = n.find(b'.')

249

l = n.find(b'.')

250

if l == -1:

250

if l == -1:

251

l = len(n)

251

l = len(n)

252

if (l == 3 and n[:3] in _winres3) or (

252

if (l == 3 and n[:3] in _winres3) or (

253

l == 4

253

l == 4

254

and n[3:4] <= b'9'

254

and n[3:4] <= b'9'

255

and n[3:4] >= b'1'

255

and n[3:4] >= b'1'

256

and n[:3] in _winres4

256

and n[:3] in _winres4

257

):

257

):

258

# encode third letter ('aux' -> 'au~78')

258

# encode third letter ('aux' -> 'au~78')

259

ec = b"~%02x" % ord(n[2:3])

259

ec = b"~%02x" % ord(n[2:3])

260

n = n[0:2] + ec + n[3:]

260

n = n[0:2] + ec + n[3:]

261

path[i] = n

261

path[i] = n

262

if n[-1] in b'. ':

262

if n[-1] in b'. ':

263

# encode last period or space ('foo...' -> 'foo..~2e')

263

# encode last period or space ('foo...' -> 'foo..~2e')

264

path[i] = n[:-1] + b"~%02x" % ord(n[-1:])

264

path[i] = n[:-1] + b"~%02x" % ord(n[-1:])

265

return path

265

return path

266

267

268

_maxstorepathlen = 120

268

_maxstorepathlen = 120

269

_dirprefixlen = 8

269

_dirprefixlen = 8

270

_maxshortdirslen = 8 * (_dirprefixlen + 1) - 4

270

_maxshortdirslen = 8 * (_dirprefixlen + 1) - 4

271

272

273

def _hashencode(path, dotencode):
    """Return the non-reversible hashed ('dh/...') form of ``path``.

    The result is ``dh/`` + shortened directory levels + filler taken from
    the basename + hex sha1 digest of ``path`` + the basename's extension.
    ``dotencode`` is passed through to ``_auxencode``.
    """
    digest = hex(hashutil.sha1(path).digest())
    le = lowerencode(path[5:]).split(b'/')  # skips prefix 'data/' or 'meta/'
    parts = _auxencode(le, dotencode)
    basename = parts[-1]
    _root, ext = os.path.splitext(basename)
    sdirs = []
    sdirslen = 0
    for p in parts[:-1]:
        d = p[:_dirprefixlen]
        if d[-1] in b'. ':
            # Windows can't access dirs ending in period or space
            d = d[:-1] + b'_'
        if sdirslen == 0:
            t = len(d)
        else:
            # +1 accounts for the '/' joining this level to the previous ones
            t = sdirslen + 1 + len(d)
            if t > _maxshortdirslen:
                break
        sdirs.append(d)
        sdirslen = t
    dirs = b'/'.join(sdirs)
    if len(dirs) > 0:
        dirs += b'/'
    res = b'dh/' + dirs + digest + ext
    spaceleft = _maxstorepathlen - len(res)
    if spaceleft > 0:
        # pad with as much of the basename as still fits
        filler = basename[:spaceleft]
        res = b'dh/' + dirs + filler + digest + ext
    return res

303

304

305

def _hybridencode(path, dotencode):
    """encodes path with a length limit

    Encodes all paths that begin with 'data/', according to the following.

    Default encoding (reversible):

    Encodes all uppercase letters 'X' as '_x'. All reserved or illegal
    characters are encoded as '~xx', where xx is the two digit hex code
    of the character (see encodefilename).
    Relevant path components consisting of Windows reserved filenames are
    masked by encoding the third character ('aux' -> 'au~78', see _auxencode).

    Hashed encoding (not reversible):

    If the default-encoded path is longer than _maxstorepathlen, a
    non-reversible hybrid hashing of the path is done instead.
    This encoding uses up to _dirprefixlen characters of all directory
    levels of the lowerencoded path, but not more levels than can fit into
    _maxshortdirslen.
    Then follows the filler followed by the sha digest of the full path.
    The filler is the beginning of the basename of the lowerencoded path
    (the basename is everything after the last path separator). The filler
    is as long as possible, filling in characters from the basename until
    the encoded path has _maxstorepathlen characters (or all chars of the
    basename have been taken).
    The extension (e.g. '.i' or '.d') is preserved.

    The string 'data/' at the beginning is replaced with 'dh/', if the hashed
    encoding was used.
    """
    path = encodedir(path)
    ef = _encodefname(path).split(b'/')
    res = b'/'.join(_auxencode(ef, dotencode))
    if len(res) > _maxstorepathlen:
        res = _hashencode(path, dotencode)
    return res

342

343

344

def _pathencode(path):
    """Encode ``path`` with dot-encoding enabled, hashing it when too long.

    The hashed form is used when either the raw ``path`` or its default
    encoding is longer than ``_maxstorepathlen``.
    """
    de = encodedir(path)
    # The length of the raw path is tested here, not the dir-encoded one.
    if len(path) > _maxstorepathlen:
        return _hashencode(de, True)
    ef = _encodefname(de).split(b'/')
    res = b'/'.join(_auxencode(ef, True))
    if len(res) > _maxstorepathlen:
        return _hashencode(de, True)
    return res

353

354

355

# Use parsers.pathencode when the loaded parsers module provides one,
# otherwise keep the Python implementation above.
_pathencode = getattr(parsers, 'pathencode', _pathencode)

356

357

358

def _plainhybridencode(f):
    """Hybrid-encode ``f`` with dot-encoding disabled."""
    return _hybridencode(f, False)

360

361

362

def _calcmode(vfs):
    """Return the ``st_mode`` of ``vfs.stat()``, or None.

    None is returned when ``vfs.stat()`` raises ``OSError`` or when the
    permission bits already equal what the umask alone would produce.
    """
    try:
        # files in .hg/ will be created using this mode
        mode = vfs.stat().st_mode
        # avoid some useless chmods
        if (0o777 & ~util.umask) == (0o777 & mode):
            mode = None
    except OSError:
        mode = None
    return mode

372

373

374

_data = [

374

_data = [

375

b'bookmarks',

375

b'bookmarks',

376

b'narrowspec',

376

b'narrowspec',

377

b'data',

377

b'data',

378

b'meta',

378

b'meta',

379

b'00manifest.d',

379

b'00manifest.d',

380

b'00manifest.i',

380

b'00manifest.i',

381

b'00changelog.d',

381

b'00changelog.d',

382

b'00changelog.i',

382

b'00changelog.i',

383

b'phaseroots',

383

b'phaseroots',

384

b'obsstore',

384

b'obsstore',

385

b'requires',

385

b'requires',

386

]

386

]

387

388

REVLOG_FILES_MAIN_EXT = (b'.i',)
REVLOG_FILES_OTHER_EXT = (
    b'.idx',
    b'.d',
    b'.dat',
    b'.n',
    b'.nd',
    b'.sda',
)
# file extension that also use a `-SOMELONGIDHASH.ext` form
REVLOG_FILES_LONG_EXT = (
    b'.nd',
    b'.idx',
    b'.dat',
    b'.sda',
)
# files that are "volatile" and might change between listing and streaming
#
# note: the ".nd" file are nodemap data and won't "change" but they might be
# deleted.
REVLOG_FILES_VOLATILE_EXT = (b'.n', b'.nd')

# some exception to the above matching
#
# XXX This is currently not in use because of issue6542
EXCLUDED = re.compile(br'.*undo\.[^/]+\.(nd?|i)$')

414

415

416

def is_revlog(f, kind, st):
    """Return ``revlog_type(f)`` for regular files and None for anything else.

    ``kind`` is compared against ``stat.S_IFREG``; ``st`` is not used.
    """
    if kind != stat.S_IFREG:
        return None
    return revlog_type(f)

420

421

422

def revlog_type(f):
    """Classify the file name ``f`` by its extension.

    Returns ``FILEFLAGS_REVLOG_MAIN`` for a main revlog extension,
    ``FILETYPE_FILELOG_OTHER`` (with ``FILEFLAGS_VOLATILE`` added for
    volatile extensions) for a secondary revlog extension, and None
    otherwise.
    """
    # XXX we need to filter `undo.` created by the transaction here, however
    # being naive about it also filter revlog for `undo.*` files, leading to
    # issue6542. So we no longer use EXCLUDED.
    if f.endswith(REVLOG_FILES_MAIN_EXT):
        return FILEFLAGS_REVLOG_MAIN
    elif f.endswith(REVLOG_FILES_OTHER_EXT):
        t = FILETYPE_FILELOG_OTHER
        if f.endswith(REVLOG_FILES_VOLATILE_EXT):
            t |= FILEFLAGS_VOLATILE
        return t
    return None

434

435

436

# the file is part of changelog data
FILEFLAGS_CHANGELOG = 1 << 13
# the file is part of manifest data
FILEFLAGS_MANIFESTLOG = 1 << 12
# the file is part of filelog data
FILEFLAGS_FILELOG = 1 << 11
# file that are not directly part of a revlog
FILEFLAGS_OTHER = 1 << 10

# the main entry point for a revlog
FILEFLAGS_REVLOG_MAIN = 1 << 1
# a secondary file for a revlog
FILEFLAGS_REVLOG_OTHER = 1 << 0

# files that are "volatile" and might change between listing and streaming
FILEFLAGS_VOLATILE = 1 << 20

FILETYPE_CHANGELOG_MAIN = FILEFLAGS_CHANGELOG | FILEFLAGS_REVLOG_MAIN
FILETYPE_CHANGELOG_OTHER = FILEFLAGS_CHANGELOG | FILEFLAGS_REVLOG_OTHER
FILETYPE_MANIFESTLOG_MAIN = FILEFLAGS_MANIFESTLOG | FILEFLAGS_REVLOG_MAIN
FILETYPE_MANIFESTLOG_OTHER = FILEFLAGS_MANIFESTLOG | FILEFLAGS_REVLOG_OTHER
FILETYPE_FILELOG_MAIN = FILEFLAGS_FILELOG | FILEFLAGS_REVLOG_MAIN
FILETYPE_FILELOG_OTHER = FILEFLAGS_FILELOG | FILEFLAGS_REVLOG_OTHER
FILETYPE_OTHER = FILEFLAGS_OTHER

460

461

462

@attr.s(slots=True)
class StoreFile:
    """a file matching a store entry"""

    unencoded_path = attr.ib()
    _file_size = attr.ib(default=None)
    is_volatile = attr.ib(default=False)

    def file_size(self, vfs):
        """Return the file size, reading it from ``vfs.stat`` on first use.

        The value is cached on the instance; a missing file
        (``FileNotFoundError``) is recorded as size 0.
        """
        if self._file_size is None:
            try:
                self._file_size = vfs.stat(self.unencoded_path).st_size
            except FileNotFoundError:
                self._file_size = 0
        return self._file_size

477

478

462

@attr.s(slots=True, init=False)
class BaseStoreEntry:
    """An entry in the store

    This is returned by `store.walk` and represent some data in the store."""

    def files(self) -> List[StoreFile]:
        """Return the files of this entry; subclasses must override this."""
        raise NotImplementedError

487

468

488

469

@attr.s(slots=True, init=False)
class SimpleStoreEntry(BaseStoreEntry):
    """A generic entry in the store"""

    is_revlog = False

    _entry_path = attr.ib()
    _is_volatile = attr.ib(default=False)
    _file_size = attr.ib(default=None)
    _files = attr.ib(default=None)

    def __init__(
        self,
        entry_path,
        is_volatile=False,
        file_size=None,
    ):
        super().__init__()
        self._entry_path = entry_path
        self._is_volatile = is_volatile
        self._file_size = file_size
        # built on the first call to files()
        self._files = None

    def files(self) -> List[StoreFile]:
        """Return a one-element list holding the StoreFile for this entry.

        The list is created on first call and reused afterwards.
        """
        if self._files is None:
            self._files = [
                StoreFile(
                    unencoded_path=self._entry_path,
                    file_size=self._file_size,
                    is_volatile=self._is_volatile,
                )
            ]
        return self._files

502

522

503

523

504

@attr.s(slots=True, init=False)
class RevlogStoreEntry(BaseStoreEntry):
    """A revlog entry in the store"""

    is_revlog = True

    revlog_type = attr.ib(default=None)
    target_id = attr.ib(default=None)
    _path_prefix = attr.ib(default=None)
    _details = attr.ib(default=None)
    _files = attr.ib(default=None)

    def __init__(
        self,
        revlog_type,
        path_prefix,
        target_id,
        details,
    ):
        super().__init__()
        self.revlog_type = revlog_type
        self.target_id = target_id
        self._path_prefix = path_prefix
        # details is keyed by file extension and must include the main '.i'
        assert b'.i' in details, (path_prefix, details)
        self._details = details
        # built on the first call to files()
        self._files = None

    @property
    def is_changelog(self):
        return self.revlog_type & FILEFLAGS_CHANGELOG

    @property
    def is_manifestlog(self):
        return self.revlog_type & FILEFLAGS_MANIFESTLOG

    @property
    def is_filelog(self):
        return self.revlog_type & FILEFLAGS_FILELOG

    def main_file_path(self):
        """unencoded path of the main revlog file"""
        return self._path_prefix + b'.i'

    def files(self) -> List[StoreFile]:
        """Return one StoreFile per extension in the entry's details.

        Extensions are ordered with ``_ext_key``; each value in the details
        mapping is expanded as keyword arguments to ``StoreFile``. The list
        is created on first call and reused afterwards.
        """
        if self._files is None:
            self._files = []
            for ext in sorted(self._details, key=_ext_key):
                path = self._path_prefix + ext
                data = self._details[ext]
                self._files.append(StoreFile(unencoded_path=path, **data))
        return self._files

    def get_revlog_instance(self, repo):
        """Obtain a revlog instance from this store entry

        An instance of the appropriate class is returned.
        """
        if self.is_changelog:
            return changelog.changelog(repo.svfs)
        elif self.is_manifestlog:
            mandir = self.target_id
            return manifest.manifestrevlog(
                repo.nodeconstants, repo.svfs, tree=mandir
            )
        else:
            return filelog.filelog(repo.svfs, self.target_id)

570

590

571

591

572

@attr.s(slots=True)
class StoreFile:
    """a file matching an entry"""

    unencoded_path = attr.ib()
    _file_size = attr.ib(default=None)
    is_volatile = attr.ib(default=False)

    def file_size(self, vfs):
        """Return the size of this file, asking `vfs` only if it is unknown

        The value obtained from `vfs.stat` is remembered for later calls; a
        file that does not exist is recorded as having size 0.
        """
        if self._file_size is not None:
            return self._file_size
        try:
            size = vfs.stat(self.unencoded_path).st_size
        except FileNotFoundError:
            size = 0
        self._file_size = size
        return size

587

588

589

def _gather_revlog(files_data):
    """group files per revlog prefix

    `files_data` is an iterable of `(unencoded_filename, value)` pairs.

    Returns a list of `(prefix, details)` pairs sorted by prefix, where
    `prefix` is the revlog filename without its extension and `details` maps
    every file "suffix" seen for that revlog to the arbitrary value that came
    with it.
    """
    grouped = {}
    for filename, payload in files_data:
        prefix, suffix = _split_revlog_ext(filename)
        grouped.setdefault(prefix, {})[suffix] = payload
    return sorted(grouped.items())

601

604

602

605

603

def _split_revlog_ext(filename):
    """split the revlog file prefix from the variable extension

    Names ending with one of REVLOG_FILES_LONG_EXT are cut at their last
    `-`, every other name at its last `.`; the separator stays with the
    extension part.
    """
    if filename.endswith(REVLOG_FILES_LONG_EXT):
        separator = b'-'
    else:
        separator = b'.'
    cut = filename.rfind(separator)
    prefix, extension = filename[:cut], filename[cut:]
    return prefix, extension

611

614

612

615

613

def _ext_key(ext):

616

def _ext_key(ext):

614

"""a key to order revlog suffix

617

"""a key to order revlog suffix

615

618

616

important to issue .i after other entry."""

619

important to issue .i after other entry."""

617

# the only important part of this order is to keep the `.i` last.

620

# the only important part of this order is to keep the `.i` last.

618

if ext.endswith(b'.n'):

621

if ext.endswith(b'.n'):

619

return (0, ext)

622

return (0, ext)

620

elif ext.endswith(b'.nd'):

623

elif ext.endswith(b'.nd'):

621

return (10, ext)

624

return (10, ext)

622

elif ext.endswith(b'.d'):

625

elif ext.endswith(b'.d'):

623

return (20, ext)

626

return (20, ext)

624

elif ext.endswith(b'.i'):

627

elif ext.endswith(b'.i'):

625

return (50, ext)

628

return (50, ext)

626

else:

629

else:

627

return (40, ext)

630

return (40, ext)

628

631

629

632

630

class basicstore:
    '''base class for local repository stores'''

    def __init__(self, path, vfstype):
        """Open `path` with `vfstype` and expose it as raw and filtered vfs"""
        rawvfs = vfstype(path)
        self.path = rawvfs.base
        self.createmode = rawvfs.createmode = _calcmode(rawvfs)
        self.rawvfs = rawvfs
        # store paths are passed through encodedir before hitting the disk
        self.vfs = vfsmod.filtervfs(rawvfs, encodedir)
        self.opener = self.vfs

    def join(self, f):
        """Return the store path followed by the directory-encoded `f`"""
        return self.path + b'/' + encodedir(f)

    def _walk(self, relpath, recurse, undecodable=None):
        '''list the files below `relpath` that `is_revlog` recognizes

        Returns a sorted list of `(unencoded, (revlog_type, size))` items.
        Sub-directories are only visited when `recurse` is true. The
        `undecodable` argument is not used by this implementation.
        '''
        root = self.path
        start = root + b'/' + relpath if relpath else root
        striplen = len(root) + 1
        found = []
        if self.rawvfs.isdir(start):
            readdir = self.rawvfs.readdir
            pending = [start]
            while pending:
                current = pending.pop()
                for name, kind, st in readdir(current, stat=True):
                    full = current + b'/' + name
                    rl_type = is_revlog(name, kind, st)
                    if rl_type is not None:
                        relative = util.pconvert(full[striplen:])
                        found.append(
                            (decodedir(relative), (rl_type, st.st_size))
                        )
                    elif kind == stat.S_IFDIR and recurse:
                        pending.append(full)

        found.sort()
        return found

    def changelog(self, trypending, concurrencychecker=None):
        """Build the changelog object reading through this store's vfs"""
        return changelog.changelog(
            self.vfs,
            trypending=trypending,
            concurrencychecker=concurrencychecker,
        )

    def manifestlog(self, repo, storenarrowmatch):
        """Build the manifestlog, backed by a root manifest revlog"""
        root = manifest.manifestrevlog(repo.nodeconstants, self.vfs)
        return manifest.manifestlog(self.vfs, repo, root, storenarrowmatch)

    def data_entries(
        self, matcher=None, undecodable=None
    ) -> Generator[BaseStoreEntry, None, None]:
        """Like walk, but excluding the changelog and root manifest.

        When [undecodable] is None, revlogs names that can't be
        decoded cause an exception. When it is provided, it should
        be a list and the filenames that can't be decoded are added
        to it instead. This is very rarely needed."""
        # (directory, revlog type, whether the last path component is dropped
        # from the target id)
        layout = [
            (b'data', FILEFLAGS_FILELOG, False),
            (b'meta', FILEFLAGS_MANIFESTLOG, True),
        ]
        for base_dir, rl_type, strip_filename in layout:
            walked = self._walk(base_dir, True, undecodable=undecodable)
            known = (item for item in walked if item[1][0] is not None)
            for revlog, details in _gather_revlog(known):
                # drop the leading `data/` or `meta/` component
                target_id = revlog.split(b'/', 1)[1]
                if strip_filename and b'/' in revlog:
                    target_id = target_id.rsplit(b'/', 1)[0]
                    target_id += b'/'
                file_details = {
                    ext: {
                        'is_volatile': bool(flags & FILEFLAGS_VOLATILE),
                        'file_size': size,
                    }
                    for ext, (flags, size) in sorted(details.items())
                }
                yield RevlogStoreEntry(
                    path_prefix=revlog,
                    revlog_type=rl_type,
                    target_id=target_id,
                    details=file_details,
                )

    def top_entries(
        self, phase=False, obsolescence=False
    ) -> Generator[BaseStoreEntry, None, None]:
        """Yield the entries stored at the top level of the store

        `phaseroots` and `obsstore` are yielded first, when requested and
        present. Other top-level files follow, then the root manifest and
        finally the changelog.
        """
        if phase and self.vfs.exists(b'phaseroots'):
            yield SimpleStoreEntry(
                entry_path=b'phaseroots',
                is_volatile=True,
            )

        if obsolescence and self.vfs.exists(b'obsstore'):
            # XXX if we had the file size it could be non-volatile
            yield SimpleStoreEntry(
                entry_path=b'obsstore',
                is_volatile=True,
            )

        changelogs = collections.defaultdict(dict)
        manifestlogs = collections.defaultdict(dict)

        for unencoded, (flags, size) in reversed(self._walk(b'', False)):
            if unencoded.startswith(b'00changelog'):
                bucket = changelogs
            elif unencoded.startswith(b'00manifest'):
                bucket = manifestlogs
            else:
                yield SimpleStoreEntry(
                    entry_path=unencoded,
                    is_volatile=bool(flags & FILEFLAGS_VOLATILE),
                    file_size=size,
                )
                continue
            name, ext = _split_revlog_ext(unencoded)
            bucket[name][ext] = (flags, size)

        # yield manifest before changelog
        top_rl = [
            (manifestlogs, FILEFLAGS_MANIFESTLOG),
            (changelogs, FILEFLAGS_CHANGELOG),
        ]
        assert len(manifestlogs) <= 1
        assert len(changelogs) <= 1
        for data, revlog_type in top_rl:
            for revlog, details in sorted(data.items()):
                file_details = {
                    ext: {
                        'is_volatile': bool(flags & FILEFLAGS_VOLATILE),
                        'file_size': size,
                    }
                    for ext, (flags, size) in details.items()
                }
                yield RevlogStoreEntry(
                    path_prefix=revlog,
                    revlog_type=revlog_type,
                    target_id=b'',
                    details=file_details,
                )

    def walk(
        self, matcher=None, phase=False, obsolescence=False
    ) -> Generator[BaseStoreEntry, None, None]:
        """return files related to data storage (ie: revlogs)

        yields instance from BaseStoreEntry subclasses

        `matcher` is forwarded to `data_entries`; `phase` and `obsolescence`
        are forwarded to `top_entries`.
        """
        # yield data files first
        yield from self.data_entries(matcher)
        yield from self.top_entries(phase=phase, obsolescence=obsolescence)

    def copylist(self):
        """Return the module-level `_data` list"""
        return _data

    def write(self, tr):
        """Nothing to write for this store type"""
        pass

    def invalidatecaches(self):
        """Nothing is cached by this store type"""
        pass

    def markremoved(self, fn):
        """Nothing to record for this store type"""
        pass

    def __contains__(self, path):
        '''Checks if the store contains path'''
        candidate = b"/".join((b"data", path))
        # file?
        if self.vfs.exists(candidate + b".i"):
            return True
        # dir?
        if not candidate.endswith(b"/"):
            candidate = candidate + b"/"
        return self.vfs.exists(candidate)

808

811

809

812

810

class encodedstore(basicstore):
    """Store kept under `<path>/store`, with names run through
    `encodefilename` / `decodefilename`"""

    def __init__(self, path, vfstype):
        """Open `<path>/store` and wrap it with the filename-encoding filter"""
        rawvfs = vfstype(path + b'/store')
        self.path = rawvfs.base
        self.createmode = rawvfs.createmode = _calcmode(rawvfs)
        self.rawvfs = rawvfs
        self.vfs = vfsmod.filtervfs(rawvfs, encodefilename)
        self.opener = self.vfs

    def _walk(self, relpath, recurse, undecodable=None):
        """Walk like the base class, then decode every returned filename

        A name that cannot be decoded raises `error.StorageError` unless an
        `undecodable` list was given, in which case the raw name is appended
        to that list and the file is left out of the result.
        """
        decoded = []
        for raw_name, value in super()._walk(relpath, recurse):
            try:
                name = decodefilename(raw_name)
            except KeyError:
                if undecodable is not None:
                    undecodable.append(raw_name)
                    continue
                msg = _(b'undecodable revlog name %s') % raw_name
                raise error.StorageError(msg)
            decoded.append((name, value))
        return decoded

    def data_entries(
        self, matcher=None, undecodable=None
    ) -> Generator[BaseStoreEntry, None, None]:
        """Yield the base class data entries accepted by
        `_match_tracked_entry` for `matcher`"""
        for entry in super().data_entries(undecodable=undecodable):
            if not _match_tracked_entry(entry, matcher):
                continue
            yield entry

    def join(self, f):
        """Return the store path followed by the encoded form of `f`"""
        return self.path + b'/' + encodefilename(f)

    def copylist(self):
        """Return `requires`, `00changelog.i` and every `_data` name prefixed
        with `store/`"""
        names = [b'requires', b'00changelog.i']
        names.extend(b'store/' + f for f in _data)
        return names

851

854

852

855

853

class fncache:
    """In-memory view of the `fncache` file read and written through `vfs`

    `entries` holds the names loaded from the file (None until loaded) and
    `addls` the names added since the last load or write.
    """

    # the filename used to be partially encoded
    # hence the encodedir/decodedir dance
    def __init__(self, vfs):
        self.vfs = vfs
        self._ignores = set()
        self.entries = None
        self._dirty = False
        # set of new additions to fncache
        self.addls = set()

    def ensureloaded(self, warn=None):
        """read the fncache file if not already read.

        If the file on disk is corrupted, raise. If warn is provided,
        warn and keep going instead."""
        if self.entries is None:
            self._load(warn)

    def _load(self, warn=None):
        '''fill the entries from the fncache file

        A file that cannot be opened (IOError) yields an empty entry set.
        When the content is invalid, `warn` is called with a message if it
        was provided, otherwise `error.Abort` is raised.
        '''
        self._dirty = False
        try:
            fp = self.vfs(b'fncache', mode=b'rb')
        except IOError:
            # skip nonexistent file
            self.entries = set()
            return

        # make sure the file is closed even when the content is rejected or
        # reading fails half way through
        try:
            self.entries = set()
            chunk = b''
            reader = functools.partial(fp.read, fncache_chunksize)
            for c in iter(reader, b''):
                chunk += c
                try:
                    p = chunk.rindex(b'\n')
                    self.entries.update(
                        decodedir(chunk[: p + 1]).splitlines()
                    )
                    chunk = chunk[p + 1 :]
                except ValueError:
                    # substring '\n' not found, maybe the entry is bigger
                    # than the chunksize, so let's keep iterating
                    pass

            if chunk:
                # leftover data means the last line had no terminator
                msg = _(b"fncache does not ends with a newline")
                if warn:
                    warn(msg + b'\n')
                else:
                    raise error.Abort(
                        msg,
                        hint=_(
                            b"use 'hg debugrebuildfncache' to "
                            b"rebuild the fncache"
                        ),
                    )
            self._checkentries(fp, warn)
        finally:
            fp.close()

    def _checkentries(self, fp, warn):
        """make sure there is no empty string in entries

        When one is found, `fp` is re-read from the start and every empty
        line is reported through `warn`, or raised as `error.Abort` when no
        `warn` callback was given."""
        if b'' in self.entries:
            fp.seek(0)
            for n, line in enumerate(fp):
                if not line.rstrip(b'\n'):
                    t = _(b'invalid entry in fncache, line %d') % (n + 1)
                    if warn:
                        warn(t + b'\n')
                    else:
                        raise error.Abort(t)

    def write(self, tr):
        """Write pending changes to the `fncache` file

        When entries were removed (`_dirty`), the whole file is rewritten
        with the loaded entries merged with the pending additions. When
        there are only additions, they are appended and the loaded entries
        are dropped so the next access reloads the file. `tr.addbackup` is
        called before either write.
        """
        if self._dirty:
            assert self.entries is not None
            self.entries = self.entries | self.addls
            self.addls = set()
            tr.addbackup(b'fncache')
            fp = self.vfs(b'fncache', mode=b'wb', atomictemp=True)
            if self.entries:
                fp.write(encodedir(b'\n'.join(self.entries) + b'\n'))
            fp.close()
            self._dirty = False
        if self.addls:
            # if we have just new entries, let's append them to the fncache
            tr.addbackup(b'fncache')
            fp = self.vfs(b'fncache', mode=b'ab', atomictemp=True)
            fp.write(encodedir(b'\n'.join(self.addls) + b'\n'))
            fp.close()
            self.entries = None
            self.addls = set()

    def addignore(self, fn):
        """Make later `add(fn)` calls a no-op for this name"""
        self._ignores.add(fn)

    def add(self, fn):
        """Queue `fn` as a new entry unless it is ignored or already loaded"""
        if fn in self._ignores:
            return
        if self.entries is None:
            self._load()
        if fn not in self.entries:
            self.addls.add(fn)

    def remove(self, fn):
        """Forget `fn`

        A pending addition is simply dropped; removing a loaded entry marks
        the cache dirty. Unknown names are ignored.
        """
        if self.entries is None:
            self._load()
        if fn in self.addls:
            self.addls.remove(fn)
            return
        try:
            self.entries.remove(fn)
            self._dirty = True
        except KeyError:
            pass

    def __contains__(self, fn):
        """True if `fn` is a pending addition or a loaded entry"""
        if fn in self.addls:
            return True
        if self.entries is None:
            self._load()
        return fn in self.entries

    def __iter__(self):
        """Iterate over the loaded entries together with pending additions"""
        if self.entries is None:
            self._load()
        return iter(self.entries | self.addls)

977

980

978

981

979

class _fncachevfs(vfsmod.proxyvfs):
    """vfs proxy that encodes paths and registers written revlog files in
    the fncache"""

    def __init__(self, vfs, fnc, encode):
        vfsmod.proxyvfs.__init__(self, vfs)
        self.fncache = fnc
        self.encode = encode

    def __call__(self, path, mode=b'r', *args, **kw):
        """Open the encoded form of `path` on the wrapped vfs

        When the file is opened with a mode other than `r`/`rb`, lives under
        `data/` or `meta/` and `revlog_type` recognizes it, the unencoded
        path is added to the fncache first (see below for the one shortcut).
        """
        encoded = self.encode(path)
        tracked = (
            mode not in (b'r', b'rb')
            and path.startswith((b'data/', b'meta/'))
            and revlog_type(path) is not None
        )
        if tracked:
            # do not trigger a fncache load when adding a file that already is
            # known to exist.
            skip = self.fncache.entries is None and self.vfs.exists(encoded)
            if skip and b'r+' in mode and not self.vfs.stat(encoded).st_size:
                # when appending to an existing file, if the file has size
                # zero, it should be considered as missing. Such zero-size
                # files are the result of truncation when a transaction is
                # aborted.
                skip = False
            if not skip:
                self.fncache.add(path)
        return self.vfs(encoded, mode, *args, **kw)

    def join(self, path):
        """Join on the wrapped vfs, encoding `path` first when it is
        non-empty"""
        if not path:
            return self.vfs.join(path)
        return self.vfs.join(self.encode(path))

    def register_file(self, path):
        """generic hook point to lets fncache steer its stew"""
        if path.startswith((b'data/', b'meta/')):
            self.fncache.add(path)

1014

1017

1015

1018

1016

class fncachestore(basicstore):

1019

class fncachestore(basicstore):

1017

def __init__(self, path, vfstype, dotencode):
    """Open `<path>/store` and wire up the fncache and its encoding vfs

    `dotencode` selects `_pathencode` over `_plainhybridencode` as the
    filename encoder.
    """
    encode = _pathencode if dotencode else _plainhybridencode
    self.encode = encode
    rawvfs = vfstype(path + b'/store')
    self.path = rawvfs.base
    self.pathsep = self.path + b'/'
    self.createmode = rawvfs.createmode = _calcmode(rawvfs)
    self.rawvfs = rawvfs
    # the fncache reads and writes through the raw (unencoded) vfs
    self.fncache = fnc = fncache(rawvfs)
    self.vfs = _fncachevfs(rawvfs, fnc, encode)
    self.opener = self.vfs

1033

1036

1034

def join(self, f):
    """Return the store directory prefix followed by the encoded `f`"""
    prefix = self.pathsep
    return prefix + self.encode(f)

1036

1039

1037

def getsize(self, path):
    """Return `st_size` of `path` as reported by the raw vfs"""
    st = self.rawvfs.stat(path)
    return st.st_size

1039

1042

1040

def data_entries(
    self, matcher=None, undecodable=None
) -> Generator[BaseStoreEntry, None, None]:
    """Yield a RevlogStoreEntry for every revlog listed in the fncache

    Only entries accepted by `_match_tracked_entry` for `matcher` are
    yielded. `undecodable` is accepted for signature compatibility and is
    not used here.
    """
    typed = ((name, revlog_type(name)) for name in self.fncache)
    # Note: all files in fncache should be revlog related, However the
    # fncache might contains such file added by previous version of
    # Mercurial.
    recognized = (item for item in typed if item[1] is not None)
    for revlog, details in _gather_revlog(recognized):
        if revlog.startswith(b'data/'):
            rl_type = FILEFLAGS_FILELOG
            revlog_target_id = revlog.split(b'/', 1)[1]
        elif revlog.startswith(b'meta/'):
            rl_type = FILEFLAGS_MANIFESTLOG
            # drop the initial directory and the `00manifest` file part
            without_root = revlog.split(b'/', 1)[1]
            revlog_target_id = without_root.rsplit(b'/', 1)[0] + b'/'
        else:
            # unreachable
            assert False, revlog
        file_details = {
            ext: {'is_volatile': bool(flags & FILEFLAGS_VOLATILE)}
            for ext, flags in details.items()
        }
        entry = RevlogStoreEntry(
            path_prefix=revlog,
            revlog_type=rl_type,
            target_id=revlog_target_id,
            details=file_details,
        )
        if _match_tracked_entry(entry, matcher):
            yield entry

1074

1077

1075

def copylist(self):

1078

def copylist(self):

1076

d = (

1079

d = (

1077

b'bookmarks',

1080

b'bookmarks',

1078

b'narrowspec',

1081

b'narrowspec',

1079

b'data',

1082

b'data',

1080

b'meta',

1083

b'meta',

1081

b'dh',

1084

b'dh',

1082

b'fncache',

1085

b'fncache',

1083

b'phaseroots',

1086

b'phaseroots',

1084

b'obsstore',

1087

b'obsstore',

1085

b'00manifest.d',

1088

b'00manifest.d',

1086

b'00manifest.i',

1089

b'00manifest.i',

1087

b'00changelog.d',

1090

b'00changelog.d',

1088

b'00changelog.i',

1091

b'00changelog.i',

1089

b'requires',

1092

b'requires',

1090

)

1093

)

1091

return [b'requires', b'00changelog.i'] + [b'store/' + f for f in d]

1094

return [b'requires', b'00changelog.i'] + [b'store/' + f for f in d]

1092

1095

1093

def write(self, tr):

1096

def write(self, tr):

1094

self.fncache.write(tr)

1097

self.fncache.write(tr)

1095

1098

1096

def invalidatecaches(self):

1099

def invalidatecaches(self):

1097

self.fncache.entries = None

1100

self.fncache.entries = None

1098

self.fncache.addls = set()

1101

self.fncache.addls = set()

1099

1102

1100

def markremoved(self, fn):

1103

def markremoved(self, fn):

1101

self.fncache.remove(fn)

1104

self.fncache.remove(fn)

1102

1105

1103

def _exists(self, f):

1106

def _exists(self, f):

1104

ef = self.encode(f)

1107

ef = self.encode(f)

1105

try:

1108

try:

1106

self.getsize(ef)

1109

self.getsize(ef)

1107

return True

1110

return True

1108

except FileNotFoundError:

1111

except FileNotFoundError:

1109

return False

1112

return False

1110

1113

1111

def __contains__(self, path):

1114

def __contains__(self, path):

1112

'''Checks if the store contains path'''

1115

'''Checks if the store contains path'''

1113

path = b"/".join((b"data", path))

1116

path = b"/".join((b"data", path))

1114

# check for files (exact match)

1117

# check for files (exact match)

1115

e = path + b'.i'

1118

e = path + b'.i'

1116

if e in self.fncache and self._exists(e):

1119

if e in self.fncache and self._exists(e):

1117

return True

1120

return True

1118

# now check for directories (prefix match)

1121

# now check for directories (prefix match)

1119

if not path.endswith(b'/'):

1122

if not path.endswith(b'/'):

1120

path += b'/'

1123

path += b'/'

1121

for e in self.fncache:

1124

for e in self.fncache:

1122

if e.startswith(path) and self._exists(e):

1125

if e.startswith(path) and self._exists(e):

1123

return True

1126

return True

1124

return False

1127

return False

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # store.py - repository store handling for Mercurial
             #
             # Copyright 2008 Olivia Mackall <olivia@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             import collections
             import functools
             import os
             import re
             import stat
-            from typing import Generator
+            from typing import Generator, List
             from .i18n import _
             from .pycompat import getattr
             from .thirdparty import attr
             from .node import hex
             from . import (
                 changelog,
                 error,
                 filelog,
                 manifest,
                 policy,
                 pycompat,
                 util,
                 vfs as vfsmod,
             )
             from .utils import hashutil
             parsers = policy.importmod('parsers')
             # How many bytes should be read from fncache in one read.
             # Reading in bounded chunks prevents loading large fncache files into
             # memory all at once.
             fncache_chunksize = 10 ** 6
             def _match_tracked_entry(entry, matcher):
                 """Tell whether a store entry tracks a path accepted by `matcher`.

                 A `None` matcher accepts every entry. A filelog entry is tested by
                 calling the matcher on its target id; a manifestlog entry is tested
                 with `matcher.visitdir` on its target id without trailing slashes.
                 Any other entry raises `error.ProgrammingError`."""
                 if matcher is not None:
                     if entry.is_filelog:
                         return matcher(entry.target_id)
                     if entry.is_manifestlog:
                         directory = entry.target_id.rstrip(b'/')
                         return matcher.visitdir(directory)
                     raise error.ProgrammingError(b"cannot process entry %r" % entry)
                 return True
             # This avoids a collision between a file named foo and a dir named
             # foo.i or foo.d
             def _encodedir(path):
                 """Escape directory names ending in `.hg`, `.i` or `.d`.

                 Each such directory gets an extra `.hg` suffix, so it cannot be
                 confused with a revlog file of the same name.

                 >>> _encodedir(b'data/foo.i')
                 'data/foo.i'
                 >>> _encodedir(b'data/foo.i/bla.i')
                 'data/foo.i.hg/bla.i'
                 >>> _encodedir(b'data/foo.i.hg/bla.i')
                 'data/foo.i.hg.hg/bla.i'
                 >>> _encodedir(b'data/foo.i\\ndata/foo.i/bla.i\\ndata/foo.i.hg/bla.i\\n')
                 'data/foo.i\\ndata/foo.i.hg/bla.i\\ndata/foo.i.hg.hg/bla.i\\n'
                 """
                 # `.hg/` must be escaped first so the `.hg/` suffixes introduced by
                 # the two later replacements are not escaped a second time.
                 substitutions = (
                     (b".hg/", b".hg.hg/"),
                     (b".i/", b".i.hg/"),
                     (b".d/", b".d.hg/"),
                 )
                 escaped = path
                 for plain, replacement in substitutions:
                     escaped = escaped.replace(plain, replacement)
                 return escaped
             # Use the `encodedir` exposed by the `parsers` module when it has one,
             # otherwise fall back to the pure-Python `_encodedir`.
             encodedir = getattr(parsers, 'encodedir', _encodedir)
             def decodedir(path):
                 """Undo the directory escaping performed by `encodedir`.

                 >>> decodedir(b'data/foo.i')
                 'data/foo.i'
                 >>> decodedir(b'data/foo.i.hg/bla.i')
                 'data/foo.i/bla.i'
                 >>> decodedir(b'data/foo.i.hg.hg/bla.i')
                 'data/foo.i.hg/bla.i'
                 """
                 # Fast path: without any `.hg/` there is nothing to unescape.
                 if b".hg/" in path:
                     for escaped, plain in (
                         (b".d.hg/", b".d/"),
                         (b".i.hg/", b".i/"),
                         (b".hg.hg/", b".hg/"),
                     ):
                         path = path.replace(escaped, plain)
                 return path
             def _reserved():
                 """Yield the byte values that are problematic for filesystems.

                 In order:

                 * ascii escapes (0..31)
                 * ascii hi (126..255)
                 * windows specials

                 These characters will be escaped by the encode functions.
                 """
                 yield from range(32)
                 yield from range(126, 256)
                 yield from (ord(c) for c in u'\\:*?"<>|')
             def _buildencodefun():
                 """Build and return the `(encode, decode)` pair for store filenames.

                 The encoder maps every byte of its input through a table: reserved
                 bytes (see `_reserved`) become `~xx` (two hex digits), uppercase
                 ASCII letters and `_` become `_` followed by the lowercase byte, and
                 every other byte is kept as is. The decoder reverses that mapping.

                 >>> enc, dec = _buildencodefun()
                 >>> enc(b'nothing/special.txt')
                 'nothing/special.txt'
                 >>> dec(b'nothing/special.txt')
                 'nothing/special.txt'
                 >>> enc(b'HELLO')
                 '_h_e_l_l_o'
                 >>> dec(b'_h_e_l_l_o')
                 'HELLO'
                 >>> enc(b'hello:world?')
                 'hello~3aworld~3f'
                 >>> dec(b'hello~3aworld~3f')
                 'hello:world?'
                 >>> enc(b'the\\x07quick\\xADshot')
                 'the~07quick~adshot'
                 >>> dec(b'the~07quick~adshot')
                 'the\\x07quick\\xadshot'
                 """
                 e = b'_'
                 xchr = pycompat.bytechr
                 # Start from the identity mapping for byte values 0..126 ...
                 asciistr = list(map(xchr, range(127)))
                 capitals = list(range(ord(b"A"), ord(b"Z") + 1))
                 cmap = {x: x for x in asciistr}
                 # ... then override (and add, for values above 126) the reserved bytes ...
                 for x in _reserved():
                     cmap[xchr(x)] = b"~%02x" % x
                 # ... and finally the capitals and the escape character itself.
                 for x in capitals + [ord(e)]:
                     cmap[xchr(x)] = e + xchr(x).lower()
                 # Reverse table: encoded token -> original byte.
                 dmap = {}
                 for k, v in cmap.items():
                     dmap[v] = k
                 def decode(s):
                     i = 0
                     while i < len(s):
                         # Encoded tokens are 1 (plain), 2 (`_x`) or 3 (`~xx`) bytes
                         # long; try each length in turn at the current position.
                         for l in range(1, 4):
                             try:
                                 yield dmap[s[i : i + l]]
                                 i += l
                                 break
                             except KeyError:
                                 pass
                         else:
                             # No token of any length matched: input is not decodable.
                             raise KeyError
                 return (
                     lambda s: b''.join([cmap[s[c : c + 1]] for c in range(len(s))]),
                     lambda s: b''.join(list(decode(s))),
                 )
             # Build the encode/decode tables once, when the module is loaded.
             _encodefname, _decodefname = _buildencodefun()
             def encodefilename(s):
                 """Encode `s`: escape its directories, then encode every byte.

                 >>> encodefilename(b'foo.i/bar.d/bla.hg/hi:world?/HELLO')
                 'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o'
                 """
                 dir_escaped = encodedir(s)
                 return _encodefname(dir_escaped)
             def decodefilename(s):
                 """Decode `s`: decode every byte, then unescape its directories.

                 >>> decodefilename(b'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o')
                 'foo.i/bar.d/bla.hg/hi:world?/HELLO'
                 """
                 byte_decoded = _decodefname(s)
                 return decodedir(byte_decoded)
             def _buildlowerencodefun():
                 """Build and return the lowercasing filename encoder.

                 The returned function escapes reserved bytes as `~xx`, lowercases
                 ASCII capitals and keeps every other byte unchanged.

                 >>> f = _buildlowerencodefun()
                 >>> f(b'nothing/special.txt')
                 'nothing/special.txt'
                 >>> f(b'HELLO')
                 'hello'
                 >>> f(b'hello:world?')
                 'hello~3aworld~3f'
                 >>> f(b'the\\x07quick\\xADshot')
                 'the~07quick~adshot'
                 """
                 xchr = pycompat.bytechr
                 table = {}
                 # identity for byte values 0..126
                 for code in range(127):
                     byte = xchr(code)
                     table[byte] = byte
                 # reserved bytes are hex-escaped
                 for code in _reserved():
                     table[xchr(code)] = b"~%02x" % code
                 # capitals are folded to lowercase
                 for code in range(ord(b"A"), ord(b"Z") + 1):
                     table[xchr(code)] = xchr(code).lower()
                 def lowerencode(s):
                     return b"".join(table[c] for c in pycompat.iterbytestr(s))
                 return lowerencode
             # Use the `lowerencode` exposed by the `parsers` module when it has a
             # truthy one, otherwise build the pure-Python encoder.
             lowerencode = getattr(parsers, 'lowerencode', None) or _buildlowerencodefun()
             # Windows reserved names: con, prn, aux, nul, com1..com9, lpt1..lpt9
             # They are listed in lowercase: `_auxencode`, which consults them,
             # assumes its input path is all lowercase.
             _winres3 = (b'aux', b'con', b'prn', b'nul')  # length 3
             _winres4 = (b'com', b'lpt')  # length 4 (with trailing 1..9)
             def _auxencode(path, dotencode):
                 """
                 Encodes filenames containing names reserved by Windows or which end in
                 period or space. Does not touch other single reserved characters c.
                 Specifically, c in '\\:*?"<>|' or ord(c) <= 31 are *not* encoded here.
                 Additionally encodes space or period at the beginning, if dotencode is
                 True. Parameter path is assumed to be all lowercase.
                 A segment only needs encoding if a reserved name appears as a
                 basename (e.g. "aux", "aux.foo"). A directory or file named "foo.aux"
                 doesn't need encoding.

                 `path` is a list of path segments; it is modified in place and the
                 same list is returned.

                 >>> s = b'.foo/aux.txt/txt.aux/con/prn/nul/foo.'
                 >>> _auxencode(s.split(b'/'), True)
                 ['~2efoo', 'au~78.txt', 'txt.aux', 'co~6e', 'pr~6e', 'nu~6c', 'foo~2e']
                 >>> s = b'.com1com2/lpt9.lpt4.lpt1/conprn/com0/lpt0/foo.'
                 >>> _auxencode(s.split(b'/'), False)
                 ['.com1com2', 'lp~749.lpt4.lpt1', 'conprn', 'com0', 'lpt0', 'foo~2e']
                 >>> _auxencode([b'foo. '], True)
                 ['foo.~20']
                 >>> _auxencode([b' .foo'], True)
                 ['~20.foo']
                 """
                 for i, n in enumerate(path):
                     # empty segments are left untouched
                     if not n:
                         continue
                     if dotencode and n[0] in b'. ':
                         # escape a leading period or space
                         n = b"~%02x" % ord(n[0:1]) + n[1:]
                         path[i] = n
                     else:
                         # `l` is the length of the part before the first period
                         # (the whole segment when there is no period)
                         l = n.find(b'.')
                         if l == -1:
                             l = len(n)
                         if (l == 3 and n[:3] in _winres3) or (
                             l == 4
                             and n[3:4] <= b'9'
                             and n[3:4] >= b'1'
                             and n[:3] in _winres4
                         ):
                             # encode third letter ('aux' -> 'au~78')
                             ec = b"~%02x" % ord(n[2:3])
                             n = n[0:2] + ec + n[3:]
                             path[i] = n
                     # checked on the possibly already rewritten segment
                     if n[-1] in b'. ':
                         # encode last period or space ('foo...' -> 'foo..~2e')
                         path[i] = n[:-1] + b"~%02x" % ord(n[-1:])
                 return path
             # Longest encoded path kept in the reversible encoding; longer results are
             # replaced by the hashed encoding (see `_hybridencode` / `_pathencode`).
             _maxstorepathlen = 120
             # Number of leading bytes kept from each directory level by `_hashencode`.
             _dirprefixlen = 8
             # Upper bound on the length of the joined shortened directories in
             # `_hashencode`.
             _maxshortdirslen = 8 * (_dirprefixlen + 1) - 4
             def _hashencode(path, dotencode):
                 """Return the hashed (non-reversible) store name for `path`.

                 The result has the form `dh/<short dirs>/<filler><sha1 hex><ext>`:
                 each directory level is cut to `_dirprefixlen` bytes, the digest is
                 the SHA-1 of the full `path`, and the filler is taken from the start
                 of the encoded basename to fill the name up to `_maxstorepathlen`.
                 `dotencode` is forwarded to `_auxencode`.
                 """
                 digest = hex(hashutil.sha1(path).digest())
                 le = lowerencode(path[5:]).split(b'/')  # skips prefix 'data/' or 'meta/'
                 parts = _auxencode(le, dotencode)
                 basename = parts[-1]
                 _root, ext = os.path.splitext(basename)
                 sdirs = []
                 sdirslen = 0
                 for p in parts[:-1]:
                     d = p[:_dirprefixlen]
                     if d[-1] in b'. ':
                         # Windows can't access dirs ending in period or space
                         d = d[:-1] + b'_'
                     if sdirslen == 0:
                         t = len(d)
                     else:
                         # +1 accounts for the `/` joining this level to the previous ones
                         t = sdirslen + 1 + len(d)
                         if t > _maxshortdirslen:
                             # no room left: drop this level and all deeper ones
                             break
                     sdirs.append(d)
                     sdirslen = t
                 dirs = b'/'.join(sdirs)
                 if len(dirs) > 0:
                     dirs += b'/'
                 res = b'dh/' + dirs + digest + ext
                 # use whatever room remains for a readable prefix of the basename
                 spaceleft = _maxstorepathlen - len(res)
                 if spaceleft > 0:
                     filler = basename[:spaceleft]
                     res = b'dh/' + dirs + filler + digest + ext
                 return res
             def _hybridencode(path, dotencode):
                 """Encode `path` for the store while enforcing a length limit.

                 Encodes all paths that begin with 'data/', according to the following.

                 Default encoding (reversible):

                 Every uppercase letter 'X' becomes '_x'. Every reserved or illegal
                 character becomes '~xx', where xx is its two digit hex code (see
                 encodefilename). Path components that are Windows reserved filenames
                 are masked by encoding their third character ('aux' -> 'au~78', see
                 _auxencode).

                 Hashed encoding (not reversible):

                 When the default-encoded path is longer than _maxstorepathlen, a
                 non-reversible hybrid hashing of the path is used instead. It keeps
                 up to _dirprefixlen characters of each directory level of the
                 lowerencoded path, but no more levels than fit into
                 _maxshortdirslen. Then comes the filler followed by the sha digest of
                 the full path. The filler is the beginning of the basename of the
                 lowerencoded path (everything after the last path separator), as long
                 as possible without the encoded path exceeding _maxstorepathlen
                 characters. The extension (e.g. '.i' or '.d') is preserved, and the
                 leading 'data/' is replaced with 'dh/'.
                 """
                 path = encodedir(path)
                 segments = _encodefname(path).split(b'/')
                 default = b'/'.join(_auxencode(segments, dotencode))
                 if len(default) <= _maxstorepathlen:
                     return default
                 return _hashencode(path, dotencode)
             def _pathencode(path):
                 """Pure-Python store path encoder, always with dot-encoding enabled.

                 Returns the reversible encoding when it fits in `_maxstorepathlen`
                 and the hashed encoding otherwise. A `path` that is already too long
                 before encoding goes straight to the hashed form.
                 """
                 de = encodedir(path)
                 if len(path) <= _maxstorepathlen:
                     parts = _auxencode(_encodefname(de).split(b'/'), True)
                     candidate = b'/'.join(parts)
                     if len(candidate) <= _maxstorepathlen:
                         return candidate
                 return _hashencode(de, True)
             # Use the `pathencode` exposed by the `parsers` module when it has one,
             # otherwise keep the pure-Python `_pathencode` defined just above.
             _pathencode = getattr(parsers, 'pathencode', _pathencode)
             def _plainhybridencode(f):
                 """Hybrid-encode `f` with dot-encoding turned off."""
                 return _hybridencode(f, dotencode=False)
             def _calcmode(vfs):
                 """Return the mode to create store files with, or None.

                 The mode is taken from `vfs.stat()`. None is returned when the stat
                 call fails with OSError, or when the permission bits already match
                 what the current umask would produce, so no chmod is needed.
                 """
                 try:
                     # files in .hg/ will be created using this mode
                     mode = vfs.stat().st_mode
                 except OSError:
                     return None
                 # avoid some useless chmods
                 if (0o777 & mode) == (0o777 & ~util.umask):
                     return None
                 return mode
             # Names of files and directories found at the top of the store.
             # NOTE(review): no use of this list is visible in this part of the file;
             # presumably it is the set of store items to copy -- confirm against callers.
             _data = [
                 b'bookmarks',
                 b'narrowspec',
                 b'data',
                 b'meta',
                 b'00manifest.d',
                 b'00manifest.i',
                 b'00changelog.d',
                 b'00changelog.i',
                 b'phaseroots',
                 b'obsstore',
                 b'requires',
             ]
             # extension of the main file of a revlog (see `revlog_type`)
             REVLOG_FILES_MAIN_EXT = (b'.i',)
             # extensions of the secondary files of a revlog (see `revlog_type`)
             REVLOG_FILES_OTHER_EXT = (
                 b'.idx',
                 b'.d',
                 b'.dat',
                 b'.n',
                 b'.nd',
                 b'.sda',
             )
             # file extension that also use a `-SOMELONGIDHASH.ext` form
             REVLOG_FILES_LONG_EXT = (
                 b'.nd',
                 b'.idx',
                 b'.dat',
                 b'.sda',
             )
             # files that are "volatile" and might change between listing and streaming
             #
             # note: the ".nd" file are nodemap data and won't "change" but they might be
             # deleted.
             REVLOG_FILES_VOLATILE_EXT = (b'.n', b'.nd')
             # some exception to the above matching
             #
             # XXX This is currently not in use because of issue6542
             EXCLUDED = re.compile(br'.*undo\.[^/]+\.(nd?|i)$')
             def is_revlog(f, kind, st):
                 """Return the revlog type of `f`, or None if it is not a revlog file.

                 Only regular files (`kind == stat.S_IFREG`) are considered; `st` is
                 not used.
                 """
                 return revlog_type(f) if kind == stat.S_IFREG else None
             def revlog_type(f):
                 """Classify `f` by its extension.

                 Returns `FILEFLAGS_REVLOG_MAIN` for a main revlog file,
                 `FILETYPE_FILELOG_OTHER` (with `FILEFLAGS_VOLATILE` added for
                 volatile extensions) for a secondary revlog file, and None for
                 anything else.
                 """
                 # XXX we need to filter `undo.` created by the transaction here, however
                 # being naive about it also filter revlog for `undo.*` files, leading to
                 # issue6542. So we no longer use EXCLUDED.
                 if f.endswith(REVLOG_FILES_MAIN_EXT):
                     return FILEFLAGS_REVLOG_MAIN
                 if not f.endswith(REVLOG_FILES_OTHER_EXT):
                     return None
                 flags = FILETYPE_FILELOG_OTHER
                 if f.endswith(REVLOG_FILES_VOLATILE_EXT):
                     flags |= FILEFLAGS_VOLATILE
                 return flags
             # Bit flags describing store files. Each flag is a distinct bit so they can
             # be combined with `|` and tested with `&`.
             #
             # the file is part of changelog data
             FILEFLAGS_CHANGELOG = 1 << 13
             # the file is part of manifest data
             FILEFLAGS_MANIFESTLOG = 1 << 12
             # the file is part of filelog data
             FILEFLAGS_FILELOG = 1 << 11
             # file that are not directly part of a revlog
             FILEFLAGS_OTHER = 1 << 10
             # the main entry point for a revlog
             FILEFLAGS_REVLOG_MAIN = 1 << 1
             # a secondary file for a revlog
             FILEFLAGS_REVLOG_OTHER = 1 << 0
             # files that are "volatile" and might change between listing and streaming
             FILEFLAGS_VOLATILE = 1 << 20
             # Combinations of a "kind of data" flag with a "main/secondary file" flag.
             FILETYPE_CHANGELOG_MAIN = FILEFLAGS_CHANGELOG | FILEFLAGS_REVLOG_MAIN
             FILETYPE_CHANGELOG_OTHER = FILEFLAGS_CHANGELOG | FILEFLAGS_REVLOG_OTHER
             FILETYPE_MANIFESTLOG_MAIN = FILEFLAGS_MANIFESTLOG | FILEFLAGS_REVLOG_MAIN
             FILETYPE_MANIFESTLOG_OTHER = FILEFLAGS_MANIFESTLOG | FILEFLAGS_REVLOG_OTHER
             FILETYPE_FILELOG_MAIN = FILEFLAGS_FILELOG | FILEFLAGS_REVLOG_MAIN
             FILETYPE_FILELOG_OTHER = FILEFLAGS_FILELOG | FILEFLAGS_REVLOG_OTHER
             FILETYPE_OTHER = FILEFLAGS_OTHER
+            @attr.s(slots=True)
+            class StoreFile:
+                """a file matching a store entry"""
+                unencoded_path = attr.ib()
+                _file_size = attr.ib(default=None)
+                is_volatile = attr.ib(default=False)
+                def file_size(self, vfs):
+                    if self._file_size is None:
+                        try:
+                            self._file_size = vfs.stat(self.unencoded_path).st_size
+                        except FileNotFoundError:
+                            self._file_size = 0
+                    return self._file_size
             @attr.s(slots=True, init=False)
             class BaseStoreEntry:
                 """An entry in the store
                 This is returned by `store.walk` and represent some data in the store."""
+                def files(self) -> List[StoreFile]:
+                    raise NotImplementedError
             @attr.s(slots=True, init=False)
             class SimpleStoreEntry(BaseStoreEntry):
                 """A generic entry in the store"""
                 is_revlog = False
                 _entry_path = attr.ib()
                 _is_volatile = attr.ib(default=False)
                 _file_size = attr.ib(default=None)
                 _files = attr.ib(default=None)
                 def __init__(
                     self,
                     entry_path,
                     is_volatile=False,
                     file_size=None,
                 ):
                     super().__init__()
                     self._entry_path = entry_path
                     self._is_volatile = is_volatile
                     self._file_size = file_size
                     self._files = None
-                def files(self):
+                def files(self) -> List[StoreFile]:
                     if self._files is None:
                         self._files = [
                             StoreFile(
                                 unencoded_path=self._entry_path,
                                 file_size=self._file_size,
                                 is_volatile=self._is_volatile,
                             )
                         ]
                     return self._files
             @attr.s(slots=True, init=False)
             class RevlogStoreEntry(BaseStoreEntry):
                 """A revlog entry in the store"""
                 is_revlog = True
                 revlog_type = attr.ib(default=None)
                 target_id = attr.ib(default=None)
                 _path_prefix = attr.ib(default=None)
                 _details = attr.ib(default=None)
                 _files = attr.ib(default=None)
                 def __init__(
                     self,
                     revlog_type,
                     path_prefix,
                     target_id,
                     details,
                 ):
                     super().__init__()
                     self.revlog_type = revlog_type
                     self.target_id = target_id
                     self._path_prefix = path_prefix
                     assert b'.i' in details, (path_prefix, details)
                     self._details = details
                     self._files = None
                 @property
                 def is_changelog(self):
                     return self.revlog_type & FILEFLAGS_CHANGELOG
                 @property
                 def is_manifestlog(self):
                     return self.revlog_type & FILEFLAGS_MANIFESTLOG
                 @property
                 def is_filelog(self):
                     return self.revlog_type & FILEFLAGS_FILELOG
                 def main_file_path(self):
                     """unencoded path of the main revlog file"""
                     return self._path_prefix + b'.i'
-                def files(self):
+                def files(self) -> List[StoreFile]:
                     if self._files is None:
                         self._files = []
                         for ext in sorted(self._details, key=_ext_key):
                             path = self._path_prefix + ext
                             data = self._details[ext]
                             self._files.append(StoreFile(unencoded_path=path, **data))
                     return self._files
                 def get_revlog_instance(self, repo):
                     """Obtain a revlog instance from this store entry
                     An instance of the appropriate class is returned.
                     """
                     if self.is_changelog:
                         return changelog.changelog(repo.svfs)
                     elif self.is_manifestlog:
                         mandir = self.target_id
                         return manifest.manifestrevlog(
                             repo.nodeconstants, repo.svfs, tree=mandir
                         )
                     else:
                         return filelog.filelog(repo.svfs, self.target_id)
-            @attr.s(slots=True)
-            class StoreFile:
-                """a file matching an entry"""
-                unencoded_path = attr.ib()
-                _file_size = attr.ib(default=None)
-                is_volatile = attr.ib(default=False)
-                def file_size(self, vfs):
-                    if self._file_size is None:
-                        try:
-                            self._file_size = vfs.stat(self.unencoded_path).st_size
-                        except FileNotFoundError:
-                            self._file_size = 0
-                    return self._file_size
             def _gather_revlog(files_data):
                 """Group files per revlog prefix.

                 `files_data` is an iterable of `(filename, value)` pairs.

                 Returns a list of `(prefix, details)` pairs sorted by prefix. `prefix`
                 is the revlog path without its extension, and `details` is a dict
                 mapping every file suffix seen for that revlog to the arbitrary
                 `value` that came with the file.
                 """
                 grouped = collections.defaultdict(dict)
                 for filename, payload in files_data:
                     prefix, suffix = _split_revlog_ext(filename)
                     grouped[prefix][suffix] = payload
                 return sorted(grouped.items())
             def _split_revlog_ext(filename):
                 """Split the revlog file prefix from the variable extension.

                 Returns a `(prefix, extension)` pair. For the extensions listed in
                 `REVLOG_FILES_LONG_EXT` the extension starts at the last `-` of the
                 basename (the `-SOMELONGIDHASH.ext` form); otherwise, or when the
                 basename has no `-`, it starts at the last `.` of the basename.

                 A name whose basename contains no separator at all is returned as
                 `(filename, b'')` instead of being cut one byte before its end.
                 """
                 # Only look at the last path component, so a `-` or `.` inside a
                 # directory name is never mistaken for the start of the extension.
                 basestart = filename.rfind(b'/') + 1
                 idx = -1
                 if filename.endswith(REVLOG_FILES_LONG_EXT):
                     idx = filename.rfind(b'-', basestart)
                 if idx == -1:
                     idx = filename.rfind(b'.', basestart)
                 if idx == -1:
                     return filename, b''
                 return filename[:idx], filename[idx:]
             def _ext_key(ext):
                 """Sort key ordering revlog suffixes.

                 It is important to issue `.i` after every other entry."""
                 # the only important part of this order is to keep the `.i` last.
                 ranking = (
                     (b'.n', 0),
                     (b'.nd', 10),
                     (b'.d', 20),
                     (b'.i', 50),
                 )
                 for suffix, rank in ranking:
                     if ext.endswith(suffix):
                         return (rank, ext)
                 return (40, ext)
             class basicstore:
                 '''base class for local repository stores'''
                 def __init__(self, path, vfstype):
                     """Open the store located at `path` using the `vfstype` factory.

                     The raw vfs is kept as `rawvfs`; `vfs` (also available as
                     `opener`) wraps it in a filter that applies `encodedir`.
                     """
                     rawvfs = vfstype(path)
                     self.path = rawvfs.base
                     mode = _calcmode(rawvfs)
                     self.createmode = mode
                     rawvfs.createmode = mode
                     self.rawvfs = rawvfs
                     self.vfs = vfsmod.filtervfs(rawvfs, encodedir)
                     self.opener = self.vfs
                 def join(self, f):
                     """Return the path of `f` inside the store, directory-encoded."""
                     return b'/'.join((self.path, encodedir(f)))
                 def _walk(self, relpath, recurse, undecodable=None):
                     """Return the revlog files found under `relpath`, sorted.

                     Each item is `(unencoded_path, (revlog_type, size))`, with the
                     path relative to the store root. Sub-directories are only
                     visited when `recurse` is true. An empty list is returned when
                     the starting path is not a directory. `undecodable` is accepted
                     but not used here.
                     """
                     root = self.path
                     if relpath:
                         root += b'/' + relpath
                     prefixlen = len(self.path) + 1
                     found = []
                     if not self.rawvfs.isdir(root):
                         return found
                     listdir = self.rawvfs.readdir
                     pending = [root]
                     while pending:
                         current = pending.pop()
                         for name, kind, st in listdir(current, stat=True):
                             full = current + b'/' + name
                             rl_type = is_revlog(name, kind, st)
                             if rl_type is not None:
                                 unencoded = decodedir(util.pconvert(full[prefixlen:]))
                                 found.append((unencoded, (rl_type, st.st_size)))
                             elif kind == stat.S_IFDIR and recurse:
                                 pending.append(full)
                     found.sort()
                     return found
                 def changelog(self, trypending, concurrencychecker=None):
                     """Return a changelog object reading from this store's vfs."""
                     options = {
                         'trypending': trypending,
                         'concurrencychecker': concurrencychecker,
                     }
                     return changelog.changelog(self.vfs, **options)
                 def manifestlog(self, repo, storenarrowmatch):
                     """Return a manifestlog built around this store's root manifest."""
                     root = manifest.manifestrevlog(repo.nodeconstants, self.vfs)
                     log = manifest.manifestlog(self.vfs, repo, root, storenarrowmatch)
                     return log
                 def data_entries(
                     self, matcher=None, undecodable=None
                 ) -> Generator[BaseStoreEntry, None, None]:
                     """Like walk, but excluding the changelog and root manifest.

                     Yields one `RevlogStoreEntry` per revlog found under `data`
                     (filelogs) and then under `meta` (manifestlogs).

                     When [undecodable] is None, revlogs names that can't be
                     decoded cause an exception. When it is provided, it should
                     be a list and the filenames that can't be decoded are added
                     to it instead. This is very rarely needed.

                     `matcher` is not consulted by this implementation."""
                     for base_dir, rl_type, strip_filename in (
                         (b'data', FILEFLAGS_FILELOG, False),
                         (b'meta', FILEFLAGS_MANIFESTLOG, True),
                     ):
                         walked = self._walk(base_dir, True, undecodable=undecodable)
                         typed = (item for item in walked if item[1][0] is not None)
                         for revlog, details in _gather_revlog(typed):
                             # drop the leading `data/` or `meta/` directory
                             target_id = revlog.split(b'/', 1)[1]
                             if strip_filename and b'/' in revlog:
                                 # keep only the directory part, with a trailing slash
                                 target_id = target_id.rsplit(b'/', 1)[0] + b'/'
                             file_details = {
                                 ext: {
                                     'is_volatile': bool(t & FILEFLAGS_VOLATILE),
                                     'file_size': s,
                                 }
                                 for ext, (t, s) in sorted(details.items())
                             }
                             yield RevlogStoreEntry(
                                 path_prefix=revlog,
                                 revlog_type=rl_type,
                                 target_id=target_id,
                                 details=file_details,
                             )
                 def top_entries(
                     self, phase=False, obsolescence=False
                 ) -> Generator[BaseStoreEntry, None, None]:
                     """Yield the entries living at the top level of the store.

                     ``phaseroots`` and ``obsstore`` are yielded first, each only when
                     requested through ``phase`` / ``obsolescence`` and present on disk.
                     Then every other top-level file is yielded as a simple entry, and
                     finally the root manifest revlog followed by the changelog revlog.
                     """
                     if phase and self.vfs.exists(b'phaseroots'):
                         yield SimpleStoreEntry(
                             entry_path=b'phaseroots',
                             is_volatile=True,
                         )
                     if obsolescence and self.vfs.exists(b'obsstore'):
                         # XXX if we had the file size it could be non-volatile
                         yield SimpleStoreEntry(
                             entry_path=b'obsstore',
                             is_volatile=True,
                         )
                     top_files = reversed(self._walk(b'', False))
                     cl_files = collections.defaultdict(dict)
                     mf_files = collections.defaultdict(dict)
                     for fname, (flags, size) in top_files:
                         if fname.startswith(b'00changelog'):
                             bucket = cl_files
                         elif fname.startswith(b'00manifest'):
                             bucket = mf_files
                         else:
                             # anything that is not a root revlog file goes out right away
                             yield SimpleStoreEntry(
                                 entry_path=fname,
                                 is_volatile=bool(flags & FILEFLAGS_VOLATILE),
                                 file_size=size,
                             )
                             continue
                         base, ext = _split_revlog_ext(fname)
                         bucket[base][ext] = (flags, size)
                     # yield manifest before changelog
                     ordered = [
                         (mf_files, FILEFLAGS_MANIFESTLOG),
                         (cl_files, FILEFLAGS_CHANGELOG),
                     ]
                     assert len(mf_files) <= 1
                     assert len(cl_files) <= 1
                     for grouped, kind in ordered:
                         for base, per_ext in sorted(grouped.items()):
                             info = {
                                 ext: {
                                     'is_volatile': bool(flags & FILEFLAGS_VOLATILE),
                                     'file_size': size,
                                 }
                                 for ext, (flags, size) in per_ext.items()
                             }
                             yield RevlogStoreEntry(
                                 path_prefix=base,
                                 revlog_type=kind,
                                 target_id=b'',
                                 details=info,
                             )
                 def walk(
                     self, matcher=None, phase=False, obsolescence=False
                 ) -> Generator[BaseStoreEntry, None, None]:
                     """Yield the files related to data storage (ie: revlogs).

                     Every yielded item is an instance of a BaseStoreEntry subclass.

                     ``matcher`` is forwarded to ``data_entries``; ``phase`` and
                     ``obsolescence`` are forwarded to ``top_entries``.
                     """
                     # data files come first, top-level entries afterwards
                     yield from self.data_entries(matcher)
                     yield from self.top_entries(phase=phase, obsolescence=obsolescence)
                 def copylist(self):
                     """Return the module-level ``_data`` collection of names, unchanged."""
                     return _data
                 def write(self, tr):
                     """Do nothing: this store keeps no state that needs writing.

                     ``tr`` is accepted for interface compatibility and ignored.
                     """
                 def invalidatecaches(self):
                     """Do nothing: this store holds no cache to invalidate."""
                 def markremoved(self, fn):
                     """Do nothing: this store does not track removed files.

                     ``fn`` is accepted for interface compatibility and ignored.
                     """
                 def __contains__(self, path):
                     """Checks if the store contains path

                     ``path`` is looked up below ``data/``: first as a file (with the
                     ``.i`` suffix appended), then as a directory (with a trailing
                     slash).
                     """
                     store_path = b"/".join([b"data", path])
                     exists = self.vfs.exists
                     # file?
                     if exists(store_path + b".i"):
                         return True
                     # dir?
                     if store_path.endswith(b"/"):
                         dir_path = store_path
                     else:
                         dir_path = store_path + b"/"
                     return exists(dir_path)
             class encodedstore(basicstore):
                 """Store whose vfs passes file names through ``encodefilename``."""

                 def __init__(self, path, vfstype):
                     """Open ``path + b'/store'`` with ``vfstype`` and wrap it in a
                     filtering vfs that encodes file names."""
                     raw = vfstype(path + b'/store')
                     self.path = raw.base
                     # the same creation mode is recorded on the store and on the raw vfs
                     self.createmode = raw.createmode = _calcmode(raw)
                     self.rawvfs = raw
                     self.vfs = self.opener = vfsmod.filtervfs(raw, encodefilename)

                 def _walk(self, relpath, recurse, undecodable=None):
                     """Walk like the parent class, returning decoded file names.

                     A name that cannot be decoded raises ``error.StorageError`` when
                     ``undecodable`` is None; otherwise the raw name is appended to
                     ``undecodable`` and the item is left out of the result.
                     """
                     decoded = []
                     for raw_name, value in super()._walk(relpath, recurse):
                         try:
                             name = decodefilename(raw_name)
                         except KeyError:
                             if undecodable is not None:
                                 undecodable.append(raw_name)
                                 continue
                             msg = _(b'undecodable revlog name %s') % raw_name
                             raise error.StorageError(msg)
                         decoded.append((name, value))
                     return decoded

                 def data_entries(
                     self, matcher=None, undecodable=None
                 ) -> Generator[BaseStoreEntry, None, None]:
                     """Yield the parent's data entries accepted by
                     ``_match_tracked_entry`` for ``matcher``."""
                     unfiltered = super().data_entries(undecodable=undecodable)
                     yield from filter(
                         lambda entry: _match_tracked_entry(entry, matcher), unfiltered
                     )

                 def join(self, f):
                     """Return the store path joined with the encoded form of ``f``."""
                     return b'/'.join((self.path, encodefilename(f)))

                 def copylist(self):
                     """Return ``requires`` and ``00changelog.i`` followed by every
                     name of ``_data`` prefixed with ``store/``."""
                     names = [b'requires', b'00changelog.i']
                     names.extend(b'store/' + name for name in _data)
                     return names
             class fncache:
                 """Set-like view of the file names recorded in the ``fncache`` file.

                 ``entries`` holds the names read from disk (``None`` until loaded),
                 ``addls`` holds the names added since the last write, and ``_dirty``
                 is set once a loaded entry has been removed so that the next
                 ``write`` rewrites the whole file instead of appending to it.
                 """

                 # the filename used to be partially encoded
                 # hence the encodedir/decodedir dance
                 def __init__(self, vfs):
                     self.vfs = vfs
                     self._ignores = set()
                     self.entries = None
                     self._dirty = False
                     # set of new additions to fncache
                     self.addls = set()

                 def ensureloaded(self, warn=None):
                     """read the fncache file if not already read.

                     If the file on disk is corrupted, raise. If warn is provided,
                     warn and keep going instead."""
                     if self.entries is None:
                         self._load(warn)

                 def _load(self, warn=None):
                     """fill the entries from the fncache file

                     A file that cannot be opened (IOError) yields an empty set of
                     entries. Data left after the last newline is reported through
                     ``warn`` when provided, otherwise ``error.Abort`` is raised.
                     """
                     self._dirty = False
                     try:
                         fp = self.vfs(b'fncache', mode=b'rb')
                     except IOError:
                         # skip nonexistent file
                         self.entries = set()
                         return
                     self.entries = set()
                     # Make sure the file is closed on every exit path, including the
                     # Abort raised below or from _checkentries.
                     try:
                         chunk = b''
                         reader = functools.partial(fp.read, fncache_chunksize)
                         for c in iter(reader, b''):
                             chunk += c
                             p = chunk.rfind(b'\n')
                             if p < 0:
                                 # no newline yet, maybe the entry is bigger than the
                                 # chunksize, so let's keep iterating
                                 continue
                             self.entries.update(decodedir(chunk[: p + 1]).splitlines())
                             chunk = chunk[p + 1 :]
                         if chunk:
                             msg = _(b"fncache does not ends with a newline")
                             if warn:
                                 warn(msg + b'\n')
                             else:
                                 raise error.Abort(
                                     msg,
                                     hint=_(
                                         b"use 'hg debugrebuildfncache' to "
                                         b"rebuild the fncache"
                                     ),
                                 )
                         self._checkentries(fp, warn)
                     finally:
                         fp.close()

                 def _checkentries(self, fp, warn):
                     """make sure there is no empty string in entries

                     When one is found, ``fp`` is re-read from the start and every
                     empty line is reported through ``warn`` if provided; otherwise
                     ``error.Abort`` is raised on the first one."""
                     if b'' in self.entries:
                         fp.seek(0)
                         for n, line in enumerate(fp):
                             if not line.rstrip(b'\n'):
                                 t = _(b'invalid entry in fncache, line %d') % (n + 1)
                                 if warn:
                                     warn(t + b'\n')
                                 else:
                                     raise error.Abort(t)

                 def write(self, tr):
                     """Persist pending changes, registering a backup with ``tr``.

                     When an entry was removed, the whole file is rewritten from
                     ``entries`` plus ``addls``. Otherwise, pending additions are
                     appended and ``entries`` is reset so the next access reloads
                     the file.
                     """
                     if self._dirty:
                         assert self.entries is not None
                         self.entries = self.entries | self.addls
                         self.addls = set()
                         tr.addbackup(b'fncache')
                         fp = self.vfs(b'fncache', mode=b'wb', atomictemp=True)
                         if self.entries:
                             fp.write(encodedir(b'\n'.join(self.entries) + b'\n'))
                         fp.close()
                         self._dirty = False
                     if self.addls:
                         # if we have just new entries, let's append them to the fncache
                         tr.addbackup(b'fncache')
                         fp = self.vfs(b'fncache', mode=b'ab', atomictemp=True)
                         fp.write(encodedir(b'\n'.join(self.addls) + b'\n'))
                         fp.close()
                         self.entries = None
                         self.addls = set()

                 def addignore(self, fn):
                     """Register ``fn`` as a name that ``add`` must silently skip."""
                     self._ignores.add(fn)

                 def add(self, fn):
                     """Record ``fn`` as a pending addition unless it is ignored or
                     already part of the loaded entries."""
                     if fn in self._ignores:
                         return
                     if self.entries is None:
                         self._load()
                     if fn not in self.entries:
                         self.addls.add(fn)

                 def remove(self, fn):
                     """Forget ``fn``.

                     A pending addition is simply dropped. Removing a loaded entry
                     marks the cache dirty. An unknown name is ignored.
                     """
                     if self.entries is None:
                         self._load()
                     if fn in self.addls:
                         self.addls.remove(fn)
                         return
                     try:
                         self.entries.remove(fn)
                         self._dirty = True
                     except KeyError:
                         pass

                 def __contains__(self, fn):
                     """Tell whether ``fn`` is a pending addition or a loaded entry."""
                     if fn in self.addls:
                         return True
                     if self.entries is None:
                         self._load()
                     return fn in self.entries

                 def __iter__(self):
                     """Iterate over the union of loaded entries and pending additions."""
                     if self.entries is None:
                         self._load()
                     return iter(self.entries | self.addls)
             class _fncachevfs(vfsmod.proxyvfs):
                 """Proxy vfs that encodes paths and records store files in an fncache."""

                 def __init__(self, vfs, fnc, encode):
                     vfsmod.proxyvfs.__init__(self, vfs)
                     self.fncache = fnc
                     self.encode = encode

                 def __call__(self, path, mode=b'r', *args, **kw):
                     """Open the encoded form of ``path`` on the wrapped vfs.

                     When the file is opened in a mode other than ``r``/``rb``, lives
                     under ``data/`` or ``meta/`` and ``revlog_type`` recognizes it,
                     the path is added to the fncache, unless the fncache is not
                     loaded and the file is already known to exist.
                     """
                     encoded = self.encode(path)
                     tracked = (
                         mode not in (b'r', b'rb')
                         and path.startswith((b'data/', b'meta/'))
                         and revlog_type(path) is not None
                     )
                     if tracked:
                         # do not trigger a fncache load when adding a file that already is
                         # known to exist.
                         known = self.fncache.entries is None and self.vfs.exists(encoded)
                         if known and b'r+' in mode:
                             # when appending to an existing file, if the file has size zero,
                             # it should be considered as missing. Such zero-size files are
                             # the result of truncation when a transaction is aborted.
                             known = bool(self.vfs.stat(encoded).st_size)
                         if not known:
                             self.fncache.add(path)
                     return self.vfs(encoded, mode, *args, **kw)

                 def join(self, path):
                     """Join on the wrapped vfs, encoding ``path`` first when it is
                     non-empty."""
                     target = self.encode(path) if path else path
                     return self.vfs.join(target)

                 def register_file(self, path):
                     """generic hook point to lets fncache steer its stew"""
                     if path.startswith((b'data/', b'meta/')):
                         self.fncache.add(path)
             class fncachestore(basicstore):
                 """Store that tracks its revlog files through an ``fncache``."""

                 def __init__(self, path, vfstype, dotencode):
                     """Open ``path + b'/store'`` with ``vfstype``.

                     ``dotencode`` selects ``_pathencode`` over ``_plainhybridencode``
                     as the path encoding function.
                     """
                     encode = _pathencode if dotencode else _plainhybridencode
                     self.encode = encode
                     raw = vfstype(path + b'/store')
                     self.path = raw.base
                     self.pathsep = self.path + b'/'
                     # the same creation mode is recorded on the store and on the raw vfs
                     self.createmode = raw.createmode = _calcmode(raw)
                     self.rawvfs = raw
                     cache = fncache(raw)
                     self.fncache = cache
                     self.vfs = self.opener = _fncachevfs(raw, cache, encode)

                 def join(self, f):
                     """Return the store path followed by the encoded form of ``f``."""
                     prefix = self.pathsep
                     return prefix + self.encode(f)

                 def getsize(self, path):
                     """Return the size reported by ``stat`` on the raw vfs for ``path``."""
                     st = self.rawvfs.stat(path)
                     return st.st_size

                 def data_entries(
                     self, matcher=None, undecodable=None
                 ) -> Generator[BaseStoreEntry, None, None]:
                     """Yield a revlog entry for each revlog listed in the fncache.

                     Only entries accepted by ``_match_tracked_entry`` for ``matcher``
                     are yielded. ``undecodable`` is not used by this implementation.
                     """
                     typed = ((name, revlog_type(name)) for name in self.fncache)
                     # Note: all files in fncache should be revlog related, However the
                     # fncache might contains such file added by previous version of
                     # Mercurial.
                     typed = filter(lambda pair: pair[1] is not None, typed)
                     for prefix, per_ext in _gather_revlog(typed):
                         if prefix.startswith(b'data/'):
                             kind = FILEFLAGS_FILELOG
                             target = prefix.split(b'/', 1)[1]
                         elif prefix.startswith(b'meta/'):
                             kind = FILEFLAGS_MANIFESTLOG
                             # drop the initial directory and the `00manifest` file part
                             below_meta = prefix.split(b'/', 1)[1]
                             target = below_meta.rsplit(b'/', 1)[0] + b'/'
                         else:
                             # unreachable
                             assert False, prefix
                         info = {
                             ext: {'is_volatile': bool(flags & FILEFLAGS_VOLATILE)}
                             for ext, flags in per_ext.items()
                         }
                         entry = RevlogStoreEntry(
                             path_prefix=prefix,
                             revlog_type=kind,
                             target_id=target,
                             details=info,
                         )
                         if _match_tracked_entry(entry, matcher):
                             yield entry

                 def copylist(self):
                     """Return ``requires`` and ``00changelog.i`` followed by a fixed
                     set of names prefixed with ``store/``."""
                     store_names = (
                         b'bookmarks',
                         b'narrowspec',
                         b'data',
                         b'meta',
                         b'dh',
                         b'fncache',
                         b'phaseroots',
                         b'obsstore',
                         b'00manifest.d',
                         b'00manifest.i',
                         b'00changelog.d',
                         b'00changelog.i',
                         b'requires',
                     )
                     names = [b'requires', b'00changelog.i']
                     names.extend(b'store/' + name for name in store_names)
                     return names

                 def write(self, tr):
                     """Write the fncache as part of transaction ``tr``."""
                     self.fncache.write(tr)

                 def invalidatecaches(self):
                     """Drop the loaded fncache entries and the pending additions."""
                     cache = self.fncache
                     cache.entries = None
                     cache.addls = set()

                 def markremoved(self, fn):
                     """Remove ``fn`` from the fncache."""
                     self.fncache.remove(fn)

                 def _exists(self, f):
                     """Tell whether the encoded form of ``f`` can be stat'ed."""
                     encoded = self.encode(f)
                     try:
                         self.getsize(encoded)
                     except FileNotFoundError:
                         return False
                     return True

                 def __contains__(self, path):
                     '''Checks if the store contains path'''
                     base = b"/".join((b"data", path))
                     # check for files (exact match)
                     index = base + b'.i'
                     if index in self.fncache and self._exists(index):
                         return True
                     # now check for directories (prefix match)
                     prefix = base if base.endswith(b'/') else base + b'/'
                     return any(
                         name.startswith(prefix) and self._exists(name)
                         for name in self.fncache
                     )