##// END OF EJS Templates
store: have the revlog determine which files are volatile itself...
marmoute -
r51561:6b522a9e default
parent child Browse files
Show More
@@ -1,1219 +1,1222 b''
1 # store.py - repository store handling for Mercurial
1 # store.py - repository store handling for Mercurial
2 #
2 #
3 # Copyright 2008 Olivia Mackall <olivia@selenic.com>
3 # Copyright 2008 Olivia Mackall <olivia@selenic.com>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 import collections
8 import collections
9 import functools
9 import functools
10 import os
10 import os
11 import re
11 import re
12 import stat
12 import stat
13 from typing import Generator, List
13 from typing import Generator, List
14
14
15 from .i18n import _
15 from .i18n import _
16 from .pycompat import getattr
16 from .pycompat import getattr
17 from .thirdparty import attr
17 from .thirdparty import attr
18 from .node import hex
18 from .node import hex
19 from . import (
19 from . import (
20 changelog,
20 changelog,
21 error,
21 error,
22 filelog,
22 filelog,
23 manifest,
23 manifest,
24 policy,
24 policy,
25 pycompat,
25 pycompat,
26 util,
26 util,
27 vfs as vfsmod,
27 vfs as vfsmod,
28 )
28 )
29 from .utils import hashutil
29 from .utils import hashutil
30
30
# prefer the C implementation of the encoding helpers when available
parsers = policy.importmod('parsers')

# how many bytes should be read from the fncache in one read
# (done to prevent loading large fncache files into memory at once)
fncache_chunksize = 10 ** 6
35
35
36
36
37 def _match_tracked_entry(entry, matcher):
37 def _match_tracked_entry(entry, matcher):
38 """parses a fncache entry and returns whether the entry is tracking a path
38 """parses a fncache entry and returns whether the entry is tracking a path
39 matched by matcher or not.
39 matched by matcher or not.
40
40
41 If matcher is None, returns True"""
41 If matcher is None, returns True"""
42
42
43 if matcher is None:
43 if matcher is None:
44 return True
44 return True
45 if entry.is_filelog:
45 if entry.is_filelog:
46 return matcher(entry.target_id)
46 return matcher(entry.target_id)
47 elif entry.is_manifestlog:
47 elif entry.is_manifestlog:
48 return matcher.visitdir(entry.target_id.rstrip(b'/'))
48 return matcher.visitdir(entry.target_id.rstrip(b'/'))
49 raise error.ProgrammingError(b"cannot process entry %r" % entry)
49 raise error.ProgrammingError(b"cannot process entry %r" % entry)
50
50
51
51
52 # This avoids a collision between a file named foo and a dir named
52 # This avoids a collision between a file named foo and a dir named
53 # foo.i or foo.d
53 # foo.i or foo.d
54 def _encodedir(path):
54 def _encodedir(path):
55 """
55 """
56 >>> _encodedir(b'data/foo.i')
56 >>> _encodedir(b'data/foo.i')
57 'data/foo.i'
57 'data/foo.i'
58 >>> _encodedir(b'data/foo.i/bla.i')
58 >>> _encodedir(b'data/foo.i/bla.i')
59 'data/foo.i.hg/bla.i'
59 'data/foo.i.hg/bla.i'
60 >>> _encodedir(b'data/foo.i.hg/bla.i')
60 >>> _encodedir(b'data/foo.i.hg/bla.i')
61 'data/foo.i.hg.hg/bla.i'
61 'data/foo.i.hg.hg/bla.i'
62 >>> _encodedir(b'data/foo.i\\ndata/foo.i/bla.i\\ndata/foo.i.hg/bla.i\\n')
62 >>> _encodedir(b'data/foo.i\\ndata/foo.i/bla.i\\ndata/foo.i.hg/bla.i\\n')
63 'data/foo.i\\ndata/foo.i.hg/bla.i\\ndata/foo.i.hg.hg/bla.i\\n'
63 'data/foo.i\\ndata/foo.i.hg/bla.i\\ndata/foo.i.hg.hg/bla.i\\n'
64 """
64 """
65 return (
65 return (
66 path.replace(b".hg/", b".hg.hg/")
66 path.replace(b".hg/", b".hg.hg/")
67 .replace(b".i/", b".i.hg/")
67 .replace(b".i/", b".i.hg/")
68 .replace(b".d/", b".d.hg/")
68 .replace(b".d/", b".d.hg/")
69 )
69 )
70
70
71
71
# use the C fast path when the parsers module provides one
encodedir = getattr(parsers, 'encodedir', _encodedir)
73
73
74
74
def decodedir(path):
    """
    >>> decodedir(b'data/foo.i')
    'data/foo.i'
    >>> decodedir(b'data/foo.i.hg/bla.i')
    'data/foo.i/bla.i'
    >>> decodedir(b'data/foo.i.hg.hg/bla.i')
    'data/foo.i.hg/bla.i'
    """
    # fast path: an un-escaped path contains no ".hg/" at all
    if b".hg/" not in path:
        return path
    # exact reverse of _encodedir, applied in the opposite order
    path = path.replace(b".d.hg/", b".d/")
    path = path.replace(b".i.hg/", b".i/")
    path = path.replace(b".hg.hg/", b".hg/")
    return path
91
91
92
92
93 def _reserved():
93 def _reserved():
94 """characters that are problematic for filesystems
94 """characters that are problematic for filesystems
95
95
96 * ascii escapes (0..31)
96 * ascii escapes (0..31)
97 * ascii hi (126..255)
97 * ascii hi (126..255)
98 * windows specials
98 * windows specials
99
99
100 these characters will be escaped by encodefunctions
100 these characters will be escaped by encodefunctions
101 """
101 """
102 winreserved = [ord(x) for x in u'\\:*?"<>|']
102 winreserved = [ord(x) for x in u'\\:*?"<>|']
103 for x in range(32):
103 for x in range(32):
104 yield x
104 yield x
105 for x in range(126, 256):
105 for x in range(126, 256):
106 yield x
106 yield x
107 for x in winreserved:
107 for x in winreserved:
108 yield x
108 yield x
109
109
110
110
def _buildencodefun():
    """
    >>> enc, dec = _buildencodefun()

    >>> enc(b'nothing/special.txt')
    'nothing/special.txt'
    >>> dec(b'nothing/special.txt')
    'nothing/special.txt'

    >>> enc(b'HELLO')
    '_h_e_l_l_o'
    >>> dec(b'_h_e_l_l_o')
    'HELLO'

    >>> enc(b'hello:world?')
    'hello~3aworld~3f'
    >>> dec(b'hello~3aworld~3f')
    'hello:world?'

    >>> enc(b'the\\x07quick\\xADshot')
    'the~07quick~adshot'
    >>> dec(b'the~07quick~adshot')
    'the\\x07quick\\xadshot'
    """
    # escape character used for uppercase letters ('X' -> '_x')
    e = b'_'
    xchr = pycompat.bytechr
    asciistr = list(map(xchr, range(127)))
    capitals = list(range(ord(b"A"), ord(b"Z") + 1))

    # start from the identity map for plain ascii, then override the
    # problematic characters with their escaped forms
    cmap = {x: x for x in asciistr}
    for x in _reserved():
        cmap[xchr(x)] = b"~%02x" % x
    for x in capitals + [ord(e)]:
        cmap[xchr(x)] = e + xchr(x).lower()

    # reverse map: escaped sequence (1 to 3 bytes) -> original byte
    dmap = {}
    for k, v in cmap.items():
        dmap[v] = k

    def decode(s):
        # greedy decode: try 1-, 2- then 3-byte sequences at each position
        i = 0
        while i < len(s):
            for l in range(1, 4):
                try:
                    yield dmap[s[i : i + l]]
                    i += l
                    break
                except KeyError:
                    pass
            else:
                # no escape sequence matched: the input is not valid output
                # of the encoder
                raise KeyError

    return (
        lambda s: b''.join([cmap[s[c : c + 1]] for c in range(len(s))]),
        lambda s: b''.join(list(decode(s))),
    )
167
167
168
168
# module-level encode/decode pair shared by the store encodings below
_encodefname, _decodefname = _buildencodefun()
170
170
171
171
def encodefilename(s):
    """
    >>> encodefilename(b'foo.i/bar.d/bla.hg/hi:world?/HELLO')
    'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o'
    """
    # escape directory-collision suffixes first, then the filename bytes
    dir_safe = encodedir(s)
    return _encodefname(dir_safe)
178
178
179
179
def decodefilename(s):
    """
    >>> decodefilename(b'foo.i.hg/bar.d.hg/bla.hg.hg/hi~3aworld~3f/_h_e_l_l_o')
    'foo.i/bar.d/bla.hg/hi:world?/HELLO'
    """
    # exact inverse of encodefilename: undo the byte escaping, then the
    # directory-collision suffixes
    name_decoded = _decodefname(s)
    return decodedir(name_decoded)
186
186
187
187
def _buildlowerencodefun():
    """
    >>> f = _buildlowerencodefun()
    >>> f(b'nothing/special.txt')
    'nothing/special.txt'
    >>> f(b'HELLO')
    'hello'
    >>> f(b'hello:world?')
    'hello~3aworld~3f'
    >>> f(b'the\\x07quick\\xADshot')
    'the~07quick~adshot'
    """
    xchr = pycompat.bytechr
    # identity for plain ascii, then override reserved characters with
    # '~xx' escapes and map uppercase to lowercase (non-reversible)
    cmap = {xchr(x): xchr(x) for x in range(127)}
    for x in _reserved():
        cmap[xchr(x)] = b"~%02x" % x
    for x in range(ord(b"A"), ord(b"Z") + 1):
        cmap[xchr(x)] = xchr(x).lower()

    def lowerencode(s):
        return b"".join([cmap[c] for c in pycompat.iterbytestr(s)])

    return lowerencode
211
211
212
212
# use the C implementation when available, otherwise build the pure-python one
lowerencode = getattr(parsers, 'lowerencode', None) or _buildlowerencodefun()
214
214
215 # Windows reserved names: con, prn, aux, nul, com1..com9, lpt1..lpt9
215 # Windows reserved names: con, prn, aux, nul, com1..com9, lpt1..lpt9
216 _winres3 = (b'aux', b'con', b'prn', b'nul') # length 3
216 _winres3 = (b'aux', b'con', b'prn', b'nul') # length 3
217 _winres4 = (b'com', b'lpt') # length 4 (with trailing 1..9)
217 _winres4 = (b'com', b'lpt') # length 4 (with trailing 1..9)
218
218
219
219
def _auxencode(path, dotencode):
    """
    Encodes filenames containing names reserved by Windows or which end in
    period or space. Does not touch other single reserved characters c.
    Specifically, c in '\\:*?"<>|' or ord(c) <= 31 are *not* encoded here.
    Additionally encodes space or period at the beginning, if dotencode is
    True. Parameter path is assumed to be all lowercase.
    A segment only needs encoding if a reserved name appears as a
    basename (e.g. "aux", "aux.foo"). A directory or file named "foo.aux"
    doesn't need encoding.

    >>> s = b'.foo/aux.txt/txt.aux/con/prn/nul/foo.'
    >>> _auxencode(s.split(b'/'), True)
    ['~2efoo', 'au~78.txt', 'txt.aux', 'co~6e', 'pr~6e', 'nu~6c', 'foo~2e']
    >>> s = b'.com1com2/lpt9.lpt4.lpt1/conprn/com0/lpt0/foo.'
    >>> _auxencode(s.split(b'/'), False)
    ['.com1com2', 'lp~749.lpt4.lpt1', 'conprn', 'com0', 'lpt0', 'foo~2e']
    >>> _auxencode([b'foo. '], True)
    ['foo.~20']
    >>> _auxencode([b' .foo'], True)
    ['~20.foo']
    """
    # note: the list is mutated in place and also returned
    for i, n in enumerate(path):
        if not n:
            continue
        if dotencode and n[0] in b'. ':
            # escape a leading period or space ('.foo' -> '~2efoo')
            n = b"~%02x" % ord(n[0:1]) + n[1:]
            path[i] = n
        else:
            # the basename up to the first period is what can collide with
            # a Windows reserved name
            l = n.find(b'.')
            if l == -1:
                l = len(n)
            if (l == 3 and n[:3] in _winres3) or (
                l == 4
                and n[3:4] <= b'9'
                and n[3:4] >= b'1'
                and n[:3] in _winres4
            ):
                # encode third letter ('aux' -> 'au~78')
                ec = b"~%02x" % ord(n[2:3])
                n = n[0:2] + ec + n[3:]
                path[i] = n
        if n[-1] in b'. ':
            # encode last period or space ('foo...' -> 'foo..~2e')
            path[i] = n[:-1] + b"~%02x" % ord(n[-1:])
    return path
266
266
267
267
268 _maxstorepathlen = 120
268 _maxstorepathlen = 120
269 _dirprefixlen = 8
269 _dirprefixlen = 8
270 _maxshortdirslen = 8 * (_dirprefixlen + 1) - 4
270 _maxshortdirslen = 8 * (_dirprefixlen + 1) - 4
271
271
272
272
def _hashencode(path, dotencode):
    """Build the hashed (non-reversible) store path for a too-long ``path``."""
    # the sha1 of the full path is always embedded in the result, which is
    # what makes the encoding collision-safe despite the truncation below
    digest = hex(hashutil.sha1(path).digest())
    le = lowerencode(path[5:]).split(b'/')  # skips prefix 'data/' or 'meta/'
    parts = _auxencode(le, dotencode)
    basename = parts[-1]
    _root, ext = os.path.splitext(basename)
    sdirs = []
    sdirslen = 0
    # keep up to _dirprefixlen chars of each directory level, stopping as
    # soon as the joined result would exceed _maxshortdirslen
    for p in parts[:-1]:
        d = p[:_dirprefixlen]
        if d[-1] in b'. ':
            # Windows can't access dirs ending in period or space
            d = d[:-1] + b'_'
        if sdirslen == 0:
            t = len(d)
        else:
            t = sdirslen + 1 + len(d)  # +1 for the joining '/'
        if t > _maxshortdirslen:
            break
        sdirs.append(d)
        sdirslen = t
    dirs = b'/'.join(sdirs)
    if len(dirs) > 0:
        dirs += b'/'
    res = b'dh/' + dirs + digest + ext
    # pad with as much of the original basename as still fits under
    # _maxstorepathlen, preserving the extension
    spaceleft = _maxstorepathlen - len(res)
    if spaceleft > 0:
        filler = basename[:spaceleft]
        res = b'dh/' + dirs + filler + digest + ext
    return res
303
303
304
304
def _hybridencode(path, dotencode):
    """encodes path with a length limit

    Encodes all paths that begin with 'data/', according to the following.

    Default encoding (reversible):

    Encodes all uppercase letters 'X' as '_x'. All reserved or illegal
    characters are encoded as '~xx', where xx is the two digit hex code
    of the character (see encodefilename).
    Relevant path components consisting of Windows reserved filenames are
    masked by encoding the third character ('aux' -> 'au~78', see _auxencode).

    Hashed encoding (not reversible):

    If the default-encoded path is longer than _maxstorepathlen, a
    non-reversible hybrid hashing of the path is done instead.
    This encoding uses up to _dirprefixlen characters of all directory
    levels of the lowerencoded path, but not more levels than can fit into
    _maxshortdirslen.
    Then follows the filler followed by the sha digest of the full path.
    The filler is the beginning of the basename of the lowerencoded path
    (the basename is everything after the last path separator). The filler
    is as long as possible, filling in characters from the basename until
    the encoded path has _maxstorepathlen characters (or all chars of the
    basename have been taken).
    The extension (e.g. '.i' or '.d') is preserved.

    The string 'data/' at the beginning is replaced with 'dh/', if the hashed
    encoding was used.
    """
    dir_encoded = encodedir(path)
    segments = _encodefname(dir_encoded).split(b'/')
    encoded = b'/'.join(_auxencode(segments, dotencode))
    if len(encoded) > _maxstorepathlen:
        # reversible form is too long: fall back to the hashed form
        return _hashencode(dir_encoded, dotencode)
    return encoded
342
342
343
343
def _pathencode(path):
    """dotencoded variant of _hybridencode (pure-python fallback)"""
    dir_encoded = encodedir(path)
    # a path this long can never fit after encoding (which only grows it),
    # so skip straight to the hashed form
    if len(path) > _maxstorepathlen:
        return _hashencode(dir_encoded, True)
    segments = _encodefname(dir_encoded).split(b'/')
    encoded = b'/'.join(_auxencode(segments, True))
    if len(encoded) > _maxstorepathlen:
        return _hashencode(dir_encoded, True)
    return encoded
353
353
354
354
# replace the python implementation with the C one when available
_pathencode = getattr(parsers, 'pathencode', _pathencode)
356
356
357
357
def _plainhybridencode(f):
    """hybrid-encode ``f`` without dot-encoding"""
    return _hybridencode(f, dotencode=False)
360
360
361
361
362 def _calcmode(vfs):
362 def _calcmode(vfs):
363 try:
363 try:
364 # files in .hg/ will be created using this mode
364 # files in .hg/ will be created using this mode
365 mode = vfs.stat().st_mode
365 mode = vfs.stat().st_mode
366 # avoid some useless chmods
366 # avoid some useless chmods
367 if (0o777 & ~util.umask) == (0o777 & mode):
367 if (0o777 & ~util.umask) == (0o777 & mode):
368 mode = None
368 mode = None
369 except OSError:
369 except OSError:
370 mode = None
370 mode = None
371 return mode
371 return mode
372
372
373
373
374 _data = [
374 _data = [
375 b'bookmarks',
375 b'bookmarks',
376 b'narrowspec',
376 b'narrowspec',
377 b'data',
377 b'data',
378 b'meta',
378 b'meta',
379 b'00manifest.d',
379 b'00manifest.d',
380 b'00manifest.i',
380 b'00manifest.i',
381 b'00changelog.d',
381 b'00changelog.d',
382 b'00changelog.i',
382 b'00changelog.i',
383 b'phaseroots',
383 b'phaseroots',
384 b'obsstore',
384 b'obsstore',
385 b'requires',
385 b'requires',
386 ]
386 ]
387
387
# the entry-point extension of a revlog
REVLOG_FILES_MAIN_EXT = (b'.i',)
# the secondary file extensions a revlog may use
REVLOG_FILES_OTHER_EXT = (
    b'.idx',
    b'.d',
    b'.dat',
    b'.n',
    b'.nd',
    b'.sda',
)
# file extension that also use a `-SOMELONGIDHASH.ext` form
REVLOG_FILES_LONG_EXT = (
    b'.nd',
    b'.idx',
    b'.dat',
    b'.sda',
)
# files that are "volatile" and might change between listing and streaming
#
# note: the ".nd" file are nodemap data and won't "change" but they might be
# deleted.
REVLOG_FILES_VOLATILE_EXT = (b'.n', b'.nd')

# some exception to the above matching
#
# XXX This is currently not in use because of issue6542
EXCLUDED = re.compile(br'.*undo\.[^/]+\.(nd?|i)$')
414
414
415
415
def is_revlog(f, kind, st):
    """Return the revlog type flags for regular file ``f``, None otherwise."""
    # only regular files can be revlogs; directories, symlinks, etc. are not
    return revlog_type(f) if kind == stat.S_IFREG else None
420
420
421
421
def revlog_type(f):
    """Classify path ``f`` by extension; None when it is not a revlog file."""
    # XXX we need to filter `undo.` created by the transaction here, however
    # being naive about it also filter revlog for `undo.*` files, leading to
    # issue6542. So we no longer use EXCLUDED.
    if f.endswith(REVLOG_FILES_MAIN_EXT):
        return FILEFLAGS_REVLOG_MAIN
    if not f.endswith(REVLOG_FILES_OTHER_EXT):
        return None
    flags = FILETYPE_FILELOG_OTHER
    if f.endswith(REVLOG_FILES_VOLATILE_EXT):
        flags |= FILEFLAGS_VOLATILE
    return flags
434
434
435
435
# the file is part of changelog data
FILEFLAGS_CHANGELOG = 1 << 13
# the file is part of manifest data
FILEFLAGS_MANIFESTLOG = 1 << 12
# the file is part of filelog data
FILEFLAGS_FILELOG = 1 << 11
# file that are not directly part of a revlog
FILEFLAGS_OTHER = 1 << 10

# the main entry point for a revlog
FILEFLAGS_REVLOG_MAIN = 1 << 1
# a secondary file for a revlog
FILEFLAGS_REVLOG_OTHER = 1 << 0

# files that are "volatile" and might change between listing and streaming
FILEFLAGS_VOLATILE = 1 << 20

# combined flags: one "what revlog is this" bit plus one "main/other" bit
FILETYPE_CHANGELOG_MAIN = FILEFLAGS_CHANGELOG | FILEFLAGS_REVLOG_MAIN
FILETYPE_CHANGELOG_OTHER = FILEFLAGS_CHANGELOG | FILEFLAGS_REVLOG_OTHER
FILETYPE_MANIFESTLOG_MAIN = FILEFLAGS_MANIFESTLOG | FILEFLAGS_REVLOG_MAIN
FILETYPE_MANIFESTLOG_OTHER = FILEFLAGS_MANIFESTLOG | FILEFLAGS_REVLOG_OTHER
FILETYPE_FILELOG_MAIN = FILEFLAGS_FILELOG | FILEFLAGS_REVLOG_MAIN
FILETYPE_FILELOG_OTHER = FILEFLAGS_FILELOG | FILEFLAGS_REVLOG_OTHER
FILETYPE_OTHER = FILEFLAGS_OTHER
460
460
461
461
@attr.s(slots=True)
class StoreFile:
    """a file matching a store entry"""

    # store-relative, unencoded path of the file
    unencoded_path = attr.ib()
    # cached size in bytes; None until file_size() is first called with a vfs
    _file_size = attr.ib(default=None)
    # volatile files may change/disappear between listing and streaming
    is_volatile = attr.ib(default=False)

    def file_size(self, vfs):
        """Return (and cache) this file's size, statting through ``vfs``.

        A missing file counts as size 0.  After the size has been cached,
        later calls may pass ``vfs=None``; doing so before any caching call
        is a programming error.
        """
        if self._file_size is None:
            if vfs is None:
                msg = b"calling vfs-less file_size without prior call: %s"
                msg %= self.unencoded_path
                raise error.ProgrammingError(msg)
            try:
                self._file_size = vfs.stat(self.unencoded_path).st_size
            except FileNotFoundError:
                # volatile files may legitimately vanish; treat as empty
                self._file_size = 0
        return self._file_size

    def get_stream(self, vfs, copies):
        """return data "stream" information for this file

        (unencoded_file_path, content_iterator, content_size)
        """
        # requires a prior file_size(vfs) call to have cached the size
        size = self.file_size(None)

        def get_stream():
            # `copies` maps the real path to a (possibly copied) source path
            actual_path = copies[vfs.join(self.unencoded_path)]
            with open(actual_path, 'rb') as fp:
                yield None  # ready to stream
                if size <= 65536:
                    # small file: a single read is cheaper than chunking
                    yield fp.read(size)
                else:
                    yield from util.filechunkiter(fp, limit=size)

        s = get_stream()
        # prime the generator up to the "ready" marker so the file is opened
        # (and open errors surface) before the caller starts consuming
        next(s)
        return (self.unencoded_path, s, size)
501
501
502
502
@attr.s(slots=True, init=False)
class BaseStoreEntry:
    """An entry in the store

    This is returned by `store.walk` and represent some data in the store."""

    def files(self) -> List[StoreFile]:
        """Return the StoreFile objects backing this entry (abstract)."""
        raise NotImplementedError

    def get_streams(
        self,
        repo=None,
        vfs=None,
        copies=None,
        max_changeset=None,
    ):
        """return a list of data stream associated to files for this entry

        return [(unencoded_file_path, content_iterator, content_size), …]
        """
        # the base implementation only needs a vfs; the other parameters
        # exist for subclasses that build smarter streams
        assert vfs is not None
        return [f.get_stream(vfs, copies) for f in self.files()]
525
525
526
526
@attr.s(slots=True, init=False)
class SimpleStoreEntry(BaseStoreEntry):
    """A generic entry in the store"""

    # this entry is a plain file, not a revlog
    is_revlog = False

    # store-relative, unencoded path of the file
    _entry_path = attr.ib()
    # whether the file may change between listing and streaming
    _is_volatile = attr.ib(default=False)
    # known size in bytes, or None to stat lazily
    _file_size = attr.ib(default=None)
    # cache for files(); built on first call
    _files = attr.ib(default=None)

    def __init__(
        self,
        entry_path,
        is_volatile=False,
        file_size=None,
    ):
        super().__init__()
        self._entry_path = entry_path
        self._is_volatile = is_volatile
        self._file_size = file_size
        self._files = None

    def files(self) -> List[StoreFile]:
        """Return the single StoreFile backing this entry (cached)."""
        if self._files is None:
            self._files = [
                StoreFile(
                    unencoded_path=self._entry_path,
                    file_size=self._file_size,
                    is_volatile=self._is_volatile,
                )
            ]
        return self._files
560
560
561
561
562 @attr.s(slots=True, init=False)
562 @attr.s(slots=True, init=False)
563 class RevlogStoreEntry(BaseStoreEntry):
563 class RevlogStoreEntry(BaseStoreEntry):
564 """A revlog entry in the store"""
564 """A revlog entry in the store"""
565
565
566 is_revlog = True
566 is_revlog = True
567
567
568 revlog_type = attr.ib(default=None)
568 revlog_type = attr.ib(default=None)
569 target_id = attr.ib(default=None)
569 target_id = attr.ib(default=None)
570 _path_prefix = attr.ib(default=None)
570 _path_prefix = attr.ib(default=None)
571 _details = attr.ib(default=None)
571 _details = attr.ib(default=None)
572 _files = attr.ib(default=None)
572 _files = attr.ib(default=None)
573
573
574 def __init__(
574 def __init__(
575 self,
575 self,
576 revlog_type,
576 revlog_type,
577 path_prefix,
577 path_prefix,
578 target_id,
578 target_id,
579 details,
579 details,
580 ):
580 ):
581 super().__init__()
581 super().__init__()
582 self.revlog_type = revlog_type
582 self.revlog_type = revlog_type
583 self.target_id = target_id
583 self.target_id = target_id
584 self._path_prefix = path_prefix
584 self._path_prefix = path_prefix
585 assert b'.i' in details, (path_prefix, details)
585 assert b'.i' in details, (path_prefix, details)
586 self._details = details
586 self._details = details
587 self._files = None
587 self._files = None
588
588
589 @property
589 @property
590 def is_changelog(self):
590 def is_changelog(self):
591 return self.revlog_type & FILEFLAGS_CHANGELOG
591 return self.revlog_type & FILEFLAGS_CHANGELOG
592
592
593 @property
593 @property
594 def is_manifestlog(self):
594 def is_manifestlog(self):
595 return self.revlog_type & FILEFLAGS_MANIFESTLOG
595 return self.revlog_type & FILEFLAGS_MANIFESTLOG
596
596
597 @property
597 @property
598 def is_filelog(self):
598 def is_filelog(self):
599 return self.revlog_type & FILEFLAGS_FILELOG
599 return self.revlog_type & FILEFLAGS_FILELOG
600
600
601 def main_file_path(self):
601 def main_file_path(self):
602 """unencoded path of the main revlog file"""
602 """unencoded path of the main revlog file"""
603 return self._path_prefix + b'.i'
603 return self._path_prefix + b'.i'
604
604
605 def files(self) -> List[StoreFile]:
605 def files(self) -> List[StoreFile]:
606 if self._files is None:
606 if self._files is None:
607 self._files = []
607 self._files = []
608 for ext in sorted(self._details, key=_ext_key):
608 for ext in sorted(self._details, key=_ext_key):
609 path = self._path_prefix + ext
609 path = self._path_prefix + ext
610 data = self._details[ext]
610 data = self._details[ext]
611 self._files.append(StoreFile(unencoded_path=path, **data))
611 # files that are "volatile" and might change between
612 # listing and streaming
613 #
614 # note: the ".nd" file are nodemap data and won't "change"
615 # but they might be deleted.
616 volatile = ext.endswith(REVLOG_FILES_VOLATILE_EXT)
617 f = StoreFile(unencoded_path=path, is_volatile=volatile, **data)
618 self._files.append(f)
612 return self._files
619 return self._files
613
620
614 def get_streams(
621 def get_streams(
615 self,
622 self,
616 repo=None,
623 repo=None,
617 vfs=None,
624 vfs=None,
618 copies=None,
625 copies=None,
619 max_changeset=None,
626 max_changeset=None,
620 ):
627 ):
621 if repo is None or max_changeset is None:
628 if repo is None or max_changeset is None:
622 return super().get_streams(
629 return super().get_streams(
623 repo=repo,
630 repo=repo,
624 vfs=vfs,
631 vfs=vfs,
625 copies=copies,
632 copies=copies,
626 max_changeset=max_changeset,
633 max_changeset=max_changeset,
627 )
634 )
628 if any(k.endswith(b'.idx') for k in self._details.keys()):
635 if any(k.endswith(b'.idx') for k in self._details.keys()):
629 # This use revlog-v2, ignore for now
636 # This use revlog-v2, ignore for now
630 return super().get_streams(
637 return super().get_streams(
631 repo=repo,
638 repo=repo,
632 vfs=vfs,
639 vfs=vfs,
633 copies=copies,
640 copies=copies,
634 max_changeset=max_changeset,
641 max_changeset=max_changeset,
635 )
642 )
636 name_to_ext = {}
643 name_to_ext = {}
637 for ext in self._details.keys():
644 for ext in self._details.keys():
638 name_to_ext[self._path_prefix + ext] = ext
645 name_to_ext[self._path_prefix + ext] = ext
639 name_to_size = {}
646 name_to_size = {}
640 for f in self.files():
647 for f in self.files():
641 name_to_size[f.unencoded_path] = f.file_size(None)
648 name_to_size[f.unencoded_path] = f.file_size(None)
642 stream = [
649 stream = [
643 f.get_stream(vfs, copies)
650 f.get_stream(vfs, copies)
644 for f in self.files()
651 for f in self.files()
645 if name_to_ext[f.unencoded_path] not in (b'.d', b'.i')
652 if name_to_ext[f.unencoded_path] not in (b'.d', b'.i')
646 ]
653 ]
647
654
648 is_inline = b'.d' not in self._details
655 is_inline = b'.d' not in self._details
649
656
650 rl = self.get_revlog_instance(repo).get_revlog()
657 rl = self.get_revlog_instance(repo).get_revlog()
651 rl_stream = rl.get_streams(max_changeset, force_inline=is_inline)
658 rl_stream = rl.get_streams(max_changeset, force_inline=is_inline)
652
659
653 for name, s, size in rl_stream:
660 for name, s, size in rl_stream:
654 if name_to_size.get(name, 0) != size:
661 if name_to_size.get(name, 0) != size:
655 msg = _(b"expected %d bytes but %d provided for %s")
662 msg = _(b"expected %d bytes but %d provided for %s")
656 msg %= name_to_size.get(name, 0), size, name
663 msg %= name_to_size.get(name, 0), size, name
657 raise error.Abort(msg)
664 raise error.Abort(msg)
658 stream.extend(rl_stream)
665 stream.extend(rl_stream)
659 files = self.files()
666 files = self.files()
660 assert len(stream) == len(files), (
667 assert len(stream) == len(files), (
661 stream,
668 stream,
662 files,
669 files,
663 self._path_prefix,
670 self._path_prefix,
664 self.target_id,
671 self.target_id,
665 )
672 )
666 return stream
673 return stream
667
674
668 def get_revlog_instance(self, repo):
675 def get_revlog_instance(self, repo):
669 """Obtain a revlog instance from this store entry
676 """Obtain a revlog instance from this store entry
670
677
671 An instance of the appropriate class is returned.
678 An instance of the appropriate class is returned.
672 """
679 """
673 if self.is_changelog:
680 if self.is_changelog:
674 return changelog.changelog(repo.svfs)
681 return changelog.changelog(repo.svfs)
675 elif self.is_manifestlog:
682 elif self.is_manifestlog:
676 mandir = self.target_id
683 mandir = self.target_id
677 return manifest.manifestrevlog(
684 return manifest.manifestrevlog(
678 repo.nodeconstants, repo.svfs, tree=mandir
685 repo.nodeconstants, repo.svfs, tree=mandir
679 )
686 )
680 else:
687 else:
681 return filelog.filelog(repo.svfs, self.target_id)
688 return filelog.filelog(repo.svfs, self.target_id)
682
689
683
690
684 def _gather_revlog(files_data):
691 def _gather_revlog(files_data):
685 """group files per revlog prefix
692 """group files per revlog prefix
686
693
687 The returns a two level nested dict. The top level key is the revlog prefix
694 The returns a two level nested dict. The top level key is the revlog prefix
688 without extension, the second level is all the file "suffix" that were
695 without extension, the second level is all the file "suffix" that were
689 seen for this revlog and arbitrary file data as value.
696 seen for this revlog and arbitrary file data as value.
690 """
697 """
691 revlogs = collections.defaultdict(dict)
698 revlogs = collections.defaultdict(dict)
692 for u, value in files_data:
699 for u, value in files_data:
693 name, ext = _split_revlog_ext(u)
700 name, ext = _split_revlog_ext(u)
694 revlogs[name][ext] = value
701 revlogs[name][ext] = value
695 return sorted(revlogs.items())
702 return sorted(revlogs.items())
696
703
697
704
698 def _split_revlog_ext(filename):
705 def _split_revlog_ext(filename):
699 """split the revlog file prefix from the variable extension"""
706 """split the revlog file prefix from the variable extension"""
700 if filename.endswith(REVLOG_FILES_LONG_EXT):
707 if filename.endswith(REVLOG_FILES_LONG_EXT):
701 char = b'-'
708 char = b'-'
702 else:
709 else:
703 char = b'.'
710 char = b'.'
704 idx = filename.rfind(char)
711 idx = filename.rfind(char)
705 return filename[:idx], filename[idx:]
712 return filename[:idx], filename[idx:]
706
713
707
714
708 def _ext_key(ext):
715 def _ext_key(ext):
709 """a key to order revlog suffix
716 """a key to order revlog suffix
710
717
711 important to issue .i after other entry."""
718 important to issue .i after other entry."""
712 # the only important part of this order is to keep the `.i` last.
719 # the only important part of this order is to keep the `.i` last.
713 if ext.endswith(b'.n'):
720 if ext.endswith(b'.n'):
714 return (0, ext)
721 return (0, ext)
715 elif ext.endswith(b'.nd'):
722 elif ext.endswith(b'.nd'):
716 return (10, ext)
723 return (10, ext)
717 elif ext.endswith(b'.d'):
724 elif ext.endswith(b'.d'):
718 return (20, ext)
725 return (20, ext)
719 elif ext.endswith(b'.i'):
726 elif ext.endswith(b'.i'):
720 return (50, ext)
727 return (50, ext)
721 else:
728 else:
722 return (40, ext)
729 return (40, ext)
723
730
724
731
725 class basicstore:
732 class basicstore:
726 '''base class for local repository stores'''
733 '''base class for local repository stores'''
727
734
728 def __init__(self, path, vfstype):
735 def __init__(self, path, vfstype):
729 vfs = vfstype(path)
736 vfs = vfstype(path)
730 self.path = vfs.base
737 self.path = vfs.base
731 self.createmode = _calcmode(vfs)
738 self.createmode = _calcmode(vfs)
732 vfs.createmode = self.createmode
739 vfs.createmode = self.createmode
733 self.rawvfs = vfs
740 self.rawvfs = vfs
734 self.vfs = vfsmod.filtervfs(vfs, encodedir)
741 self.vfs = vfsmod.filtervfs(vfs, encodedir)
735 self.opener = self.vfs
742 self.opener = self.vfs
736
743
737 def join(self, f):
744 def join(self, f):
738 return self.path + b'/' + encodedir(f)
745 return self.path + b'/' + encodedir(f)
739
746
740 def _walk(self, relpath, recurse, undecodable=None):
747 def _walk(self, relpath, recurse, undecodable=None):
741 '''yields (revlog_type, unencoded, size)'''
748 '''yields (revlog_type, unencoded, size)'''
742 path = self.path
749 path = self.path
743 if relpath:
750 if relpath:
744 path += b'/' + relpath
751 path += b'/' + relpath
745 striplen = len(self.path) + 1
752 striplen = len(self.path) + 1
746 l = []
753 l = []
747 if self.rawvfs.isdir(path):
754 if self.rawvfs.isdir(path):
748 visit = [path]
755 visit = [path]
749 readdir = self.rawvfs.readdir
756 readdir = self.rawvfs.readdir
750 while visit:
757 while visit:
751 p = visit.pop()
758 p = visit.pop()
752 for f, kind, st in readdir(p, stat=True):
759 for f, kind, st in readdir(p, stat=True):
753 fp = p + b'/' + f
760 fp = p + b'/' + f
754 rl_type = is_revlog(f, kind, st)
761 rl_type = is_revlog(f, kind, st)
755 if rl_type is not None:
762 if rl_type is not None:
756 n = util.pconvert(fp[striplen:])
763 n = util.pconvert(fp[striplen:])
757 l.append((decodedir(n), (rl_type, st.st_size)))
764 l.append((decodedir(n), (rl_type, st.st_size)))
758 elif kind == stat.S_IFDIR and recurse:
765 elif kind == stat.S_IFDIR and recurse:
759 visit.append(fp)
766 visit.append(fp)
760
767
761 l.sort()
768 l.sort()
762 return l
769 return l
763
770
764 def changelog(self, trypending, concurrencychecker=None):
771 def changelog(self, trypending, concurrencychecker=None):
765 return changelog.changelog(
772 return changelog.changelog(
766 self.vfs,
773 self.vfs,
767 trypending=trypending,
774 trypending=trypending,
768 concurrencychecker=concurrencychecker,
775 concurrencychecker=concurrencychecker,
769 )
776 )
770
777
771 def manifestlog(self, repo, storenarrowmatch):
778 def manifestlog(self, repo, storenarrowmatch):
772 rootstore = manifest.manifestrevlog(repo.nodeconstants, self.vfs)
779 rootstore = manifest.manifestrevlog(repo.nodeconstants, self.vfs)
773 return manifest.manifestlog(self.vfs, repo, rootstore, storenarrowmatch)
780 return manifest.manifestlog(self.vfs, repo, rootstore, storenarrowmatch)
774
781
775 def data_entries(
782 def data_entries(
776 self, matcher=None, undecodable=None
783 self, matcher=None, undecodable=None
777 ) -> Generator[BaseStoreEntry, None, None]:
784 ) -> Generator[BaseStoreEntry, None, None]:
778 """Like walk, but excluding the changelog and root manifest.
785 """Like walk, but excluding the changelog and root manifest.
779
786
780 When [undecodable] is None, revlogs names that can't be
787 When [undecodable] is None, revlogs names that can't be
781 decoded cause an exception. When it is provided, it should
788 decoded cause an exception. When it is provided, it should
782 be a list and the filenames that can't be decoded are added
789 be a list and the filenames that can't be decoded are added
783 to it instead. This is very rarely needed."""
790 to it instead. This is very rarely needed."""
784 dirs = [
791 dirs = [
785 (b'data', FILEFLAGS_FILELOG, False),
792 (b'data', FILEFLAGS_FILELOG, False),
786 (b'meta', FILEFLAGS_MANIFESTLOG, True),
793 (b'meta', FILEFLAGS_MANIFESTLOG, True),
787 ]
794 ]
788 for base_dir, rl_type, strip_filename in dirs:
795 for base_dir, rl_type, strip_filename in dirs:
789 files = self._walk(base_dir, True, undecodable=undecodable)
796 files = self._walk(base_dir, True, undecodable=undecodable)
790 files = (f for f in files if f[1][0] is not None)
797 files = (f for f in files if f[1][0] is not None)
791 for revlog, details in _gather_revlog(files):
798 for revlog, details in _gather_revlog(files):
792 file_details = {}
799 file_details = {}
793 revlog_target_id = revlog.split(b'/', 1)[1]
800 revlog_target_id = revlog.split(b'/', 1)[1]
794 if strip_filename and b'/' in revlog:
801 if strip_filename and b'/' in revlog:
795 revlog_target_id = revlog_target_id.rsplit(b'/', 1)[0]
802 revlog_target_id = revlog_target_id.rsplit(b'/', 1)[0]
796 revlog_target_id += b'/'
803 revlog_target_id += b'/'
797 for ext, (t, s) in sorted(details.items()):
804 for ext, (t, s) in sorted(details.items()):
798 file_details[ext] = {
805 file_details[ext] = {
799 'is_volatile': bool(t & FILEFLAGS_VOLATILE),
800 'file_size': s,
806 'file_size': s,
801 }
807 }
802 yield RevlogStoreEntry(
808 yield RevlogStoreEntry(
803 path_prefix=revlog,
809 path_prefix=revlog,
804 revlog_type=rl_type,
810 revlog_type=rl_type,
805 target_id=revlog_target_id,
811 target_id=revlog_target_id,
806 details=file_details,
812 details=file_details,
807 )
813 )
808
814
809 def top_entries(
815 def top_entries(
810 self, phase=False, obsolescence=False
816 self, phase=False, obsolescence=False
811 ) -> Generator[BaseStoreEntry, None, None]:
817 ) -> Generator[BaseStoreEntry, None, None]:
812 if phase and self.vfs.exists(b'phaseroots'):
818 if phase and self.vfs.exists(b'phaseroots'):
813 yield SimpleStoreEntry(
819 yield SimpleStoreEntry(
814 entry_path=b'phaseroots',
820 entry_path=b'phaseroots',
815 is_volatile=True,
821 is_volatile=True,
816 )
822 )
817
823
818 if obsolescence and self.vfs.exists(b'obsstore'):
824 if obsolescence and self.vfs.exists(b'obsstore'):
819 # XXX if we had the file size it could be non-volatile
825 # XXX if we had the file size it could be non-volatile
820 yield SimpleStoreEntry(
826 yield SimpleStoreEntry(
821 entry_path=b'obsstore',
827 entry_path=b'obsstore',
822 is_volatile=True,
828 is_volatile=True,
823 )
829 )
824
830
825 files = reversed(self._walk(b'', False))
831 files = reversed(self._walk(b'', False))
826
832
827 changelogs = collections.defaultdict(dict)
833 changelogs = collections.defaultdict(dict)
828 manifestlogs = collections.defaultdict(dict)
834 manifestlogs = collections.defaultdict(dict)
829
835
830 for u, (t, s) in files:
836 for u, (t, s) in files:
831 if u.startswith(b'00changelog'):
837 if u.startswith(b'00changelog'):
832 name, ext = _split_revlog_ext(u)
838 name, ext = _split_revlog_ext(u)
833 changelogs[name][ext] = (t, s)
839 changelogs[name][ext] = (t, s)
834 elif u.startswith(b'00manifest'):
840 elif u.startswith(b'00manifest'):
835 name, ext = _split_revlog_ext(u)
841 name, ext = _split_revlog_ext(u)
836 manifestlogs[name][ext] = (t, s)
842 manifestlogs[name][ext] = (t, s)
837 else:
843 else:
838 yield SimpleStoreEntry(
844 yield SimpleStoreEntry(
839 entry_path=u,
845 entry_path=u,
840 is_volatile=bool(t & FILEFLAGS_VOLATILE),
846 is_volatile=bool(t & FILEFLAGS_VOLATILE),
841 file_size=s,
847 file_size=s,
842 )
848 )
843 # yield manifest before changelog
849 # yield manifest before changelog
844 top_rl = [
850 top_rl = [
845 (manifestlogs, FILEFLAGS_MANIFESTLOG),
851 (manifestlogs, FILEFLAGS_MANIFESTLOG),
846 (changelogs, FILEFLAGS_CHANGELOG),
852 (changelogs, FILEFLAGS_CHANGELOG),
847 ]
853 ]
848 assert len(manifestlogs) <= 1
854 assert len(manifestlogs) <= 1
849 assert len(changelogs) <= 1
855 assert len(changelogs) <= 1
850 for data, revlog_type in top_rl:
856 for data, revlog_type in top_rl:
851 for revlog, details in sorted(data.items()):
857 for revlog, details in sorted(data.items()):
852 file_details = {}
858 file_details = {}
853 for ext, (t, s) in details.items():
859 for ext, (t, s) in details.items():
854 file_details[ext] = {
860 file_details[ext] = {
855 'is_volatile': bool(t & FILEFLAGS_VOLATILE),
856 'file_size': s,
861 'file_size': s,
857 }
862 }
858 yield RevlogStoreEntry(
863 yield RevlogStoreEntry(
859 path_prefix=revlog,
864 path_prefix=revlog,
860 revlog_type=revlog_type,
865 revlog_type=revlog_type,
861 target_id=b'',
866 target_id=b'',
862 details=file_details,
867 details=file_details,
863 )
868 )
864
869
865 def walk(
870 def walk(
866 self, matcher=None, phase=False, obsolescence=False
871 self, matcher=None, phase=False, obsolescence=False
867 ) -> Generator[BaseStoreEntry, None, None]:
872 ) -> Generator[BaseStoreEntry, None, None]:
868 """return files related to data storage (ie: revlogs)
873 """return files related to data storage (ie: revlogs)
869
874
870 yields instance from BaseStoreEntry subclasses
875 yields instance from BaseStoreEntry subclasses
871
876
872 if a matcher is passed, storage files of only those tracked paths
877 if a matcher is passed, storage files of only those tracked paths
873 are passed with matches the matcher
878 are passed with matches the matcher
874 """
879 """
875 # yield data files first
880 # yield data files first
876 for x in self.data_entries(matcher):
881 for x in self.data_entries(matcher):
877 yield x
882 yield x
878 for x in self.top_entries(phase=phase, obsolescence=obsolescence):
883 for x in self.top_entries(phase=phase, obsolescence=obsolescence):
879 yield x
884 yield x
880
885
881 def copylist(self):
886 def copylist(self):
882 return _data
887 return _data
883
888
884 def write(self, tr):
889 def write(self, tr):
885 pass
890 pass
886
891
887 def invalidatecaches(self):
892 def invalidatecaches(self):
888 pass
893 pass
889
894
890 def markremoved(self, fn):
895 def markremoved(self, fn):
891 pass
896 pass
892
897
893 def __contains__(self, path):
898 def __contains__(self, path):
894 '''Checks if the store contains path'''
899 '''Checks if the store contains path'''
895 path = b"/".join((b"data", path))
900 path = b"/".join((b"data", path))
896 # file?
901 # file?
897 if self.vfs.exists(path + b".i"):
902 if self.vfs.exists(path + b".i"):
898 return True
903 return True
899 # dir?
904 # dir?
900 if not path.endswith(b"/"):
905 if not path.endswith(b"/"):
901 path = path + b"/"
906 path = path + b"/"
902 return self.vfs.exists(path)
907 return self.vfs.exists(path)
903
908
904
909
905 class encodedstore(basicstore):
910 class encodedstore(basicstore):
906 def __init__(self, path, vfstype):
911 def __init__(self, path, vfstype):
907 vfs = vfstype(path + b'/store')
912 vfs = vfstype(path + b'/store')
908 self.path = vfs.base
913 self.path = vfs.base
909 self.createmode = _calcmode(vfs)
914 self.createmode = _calcmode(vfs)
910 vfs.createmode = self.createmode
915 vfs.createmode = self.createmode
911 self.rawvfs = vfs
916 self.rawvfs = vfs
912 self.vfs = vfsmod.filtervfs(vfs, encodefilename)
917 self.vfs = vfsmod.filtervfs(vfs, encodefilename)
913 self.opener = self.vfs
918 self.opener = self.vfs
914
919
915 def _walk(self, relpath, recurse, undecodable=None):
920 def _walk(self, relpath, recurse, undecodable=None):
916 old = super()._walk(relpath, recurse)
921 old = super()._walk(relpath, recurse)
917 new = []
922 new = []
918 for f1, value in old:
923 for f1, value in old:
919 try:
924 try:
920 f2 = decodefilename(f1)
925 f2 = decodefilename(f1)
921 except KeyError:
926 except KeyError:
922 if undecodable is None:
927 if undecodable is None:
923 msg = _(b'undecodable revlog name %s') % f1
928 msg = _(b'undecodable revlog name %s') % f1
924 raise error.StorageError(msg)
929 raise error.StorageError(msg)
925 else:
930 else:
926 undecodable.append(f1)
931 undecodable.append(f1)
927 continue
932 continue
928 new.append((f2, value))
933 new.append((f2, value))
929 return new
934 return new
930
935
931 def data_entries(
936 def data_entries(
932 self, matcher=None, undecodable=None
937 self, matcher=None, undecodable=None
933 ) -> Generator[BaseStoreEntry, None, None]:
938 ) -> Generator[BaseStoreEntry, None, None]:
934 entries = super(encodedstore, self).data_entries(
939 entries = super(encodedstore, self).data_entries(
935 undecodable=undecodable
940 undecodable=undecodable
936 )
941 )
937 for entry in entries:
942 for entry in entries:
938 if _match_tracked_entry(entry, matcher):
943 if _match_tracked_entry(entry, matcher):
939 yield entry
944 yield entry
940
945
941 def join(self, f):
946 def join(self, f):
942 return self.path + b'/' + encodefilename(f)
947 return self.path + b'/' + encodefilename(f)
943
948
944 def copylist(self):
949 def copylist(self):
945 return [b'requires', b'00changelog.i'] + [b'store/' + f for f in _data]
950 return [b'requires', b'00changelog.i'] + [b'store/' + f for f in _data]
946
951
947
952
948 class fncache:
953 class fncache:
949 # the filename used to be partially encoded
954 # the filename used to be partially encoded
950 # hence the encodedir/decodedir dance
955 # hence the encodedir/decodedir dance
951 def __init__(self, vfs):
956 def __init__(self, vfs):
952 self.vfs = vfs
957 self.vfs = vfs
953 self._ignores = set()
958 self._ignores = set()
954 self.entries = None
959 self.entries = None
955 self._dirty = False
960 self._dirty = False
956 # set of new additions to fncache
961 # set of new additions to fncache
957 self.addls = set()
962 self.addls = set()
958
963
959 def ensureloaded(self, warn=None):
964 def ensureloaded(self, warn=None):
960 """read the fncache file if not already read.
965 """read the fncache file if not already read.
961
966
962 If the file on disk is corrupted, raise. If warn is provided,
967 If the file on disk is corrupted, raise. If warn is provided,
963 warn and keep going instead."""
968 warn and keep going instead."""
964 if self.entries is None:
969 if self.entries is None:
965 self._load(warn)
970 self._load(warn)
966
971
967 def _load(self, warn=None):
972 def _load(self, warn=None):
968 '''fill the entries from the fncache file'''
973 '''fill the entries from the fncache file'''
969 self._dirty = False
974 self._dirty = False
970 try:
975 try:
971 fp = self.vfs(b'fncache', mode=b'rb')
976 fp = self.vfs(b'fncache', mode=b'rb')
972 except IOError:
977 except IOError:
973 # skip nonexistent file
978 # skip nonexistent file
974 self.entries = set()
979 self.entries = set()
975 return
980 return
976
981
977 self.entries = set()
982 self.entries = set()
978 chunk = b''
983 chunk = b''
979 for c in iter(functools.partial(fp.read, fncache_chunksize), b''):
984 for c in iter(functools.partial(fp.read, fncache_chunksize), b''):
980 chunk += c
985 chunk += c
981 try:
986 try:
982 p = chunk.rindex(b'\n')
987 p = chunk.rindex(b'\n')
983 self.entries.update(decodedir(chunk[: p + 1]).splitlines())
988 self.entries.update(decodedir(chunk[: p + 1]).splitlines())
984 chunk = chunk[p + 1 :]
989 chunk = chunk[p + 1 :]
985 except ValueError:
990 except ValueError:
986 # substring '\n' not found, maybe the entry is bigger than the
991 # substring '\n' not found, maybe the entry is bigger than the
987 # chunksize, so let's keep iterating
992 # chunksize, so let's keep iterating
988 pass
993 pass
989
994
990 if chunk:
995 if chunk:
991 msg = _(b"fncache does not ends with a newline")
996 msg = _(b"fncache does not ends with a newline")
992 if warn:
997 if warn:
993 warn(msg + b'\n')
998 warn(msg + b'\n')
994 else:
999 else:
995 raise error.Abort(
1000 raise error.Abort(
996 msg,
1001 msg,
997 hint=_(
1002 hint=_(
998 b"use 'hg debugrebuildfncache' to "
1003 b"use 'hg debugrebuildfncache' to "
999 b"rebuild the fncache"
1004 b"rebuild the fncache"
1000 ),
1005 ),
1001 )
1006 )
1002 self._checkentries(fp, warn)
1007 self._checkentries(fp, warn)
1003 fp.close()
1008 fp.close()
1004
1009
1005 def _checkentries(self, fp, warn):
1010 def _checkentries(self, fp, warn):
1006 """make sure there is no empty string in entries"""
1011 """make sure there is no empty string in entries"""
1007 if b'' in self.entries:
1012 if b'' in self.entries:
1008 fp.seek(0)
1013 fp.seek(0)
1009 for n, line in enumerate(fp):
1014 for n, line in enumerate(fp):
1010 if not line.rstrip(b'\n'):
1015 if not line.rstrip(b'\n'):
1011 t = _(b'invalid entry in fncache, line %d') % (n + 1)
1016 t = _(b'invalid entry in fncache, line %d') % (n + 1)
1012 if warn:
1017 if warn:
1013 warn(t + b'\n')
1018 warn(t + b'\n')
1014 else:
1019 else:
1015 raise error.Abort(t)
1020 raise error.Abort(t)
1016
1021
1017 def write(self, tr):
1022 def write(self, tr):
1018 if self._dirty:
1023 if self._dirty:
1019 assert self.entries is not None
1024 assert self.entries is not None
1020 self.entries = self.entries | self.addls
1025 self.entries = self.entries | self.addls
1021 self.addls = set()
1026 self.addls = set()
1022 tr.addbackup(b'fncache')
1027 tr.addbackup(b'fncache')
1023 fp = self.vfs(b'fncache', mode=b'wb', atomictemp=True)
1028 fp = self.vfs(b'fncache', mode=b'wb', atomictemp=True)
1024 if self.entries:
1029 if self.entries:
1025 fp.write(encodedir(b'\n'.join(self.entries) + b'\n'))
1030 fp.write(encodedir(b'\n'.join(self.entries) + b'\n'))
1026 fp.close()
1031 fp.close()
1027 self._dirty = False
1032 self._dirty = False
1028 if self.addls:
1033 if self.addls:
1029 # if we have just new entries, let's append them to the fncache
1034 # if we have just new entries, let's append them to the fncache
1030 tr.addbackup(b'fncache')
1035 tr.addbackup(b'fncache')
1031 fp = self.vfs(b'fncache', mode=b'ab', atomictemp=True)
1036 fp = self.vfs(b'fncache', mode=b'ab', atomictemp=True)
1032 if self.addls:
1037 if self.addls:
1033 fp.write(encodedir(b'\n'.join(self.addls) + b'\n'))
1038 fp.write(encodedir(b'\n'.join(self.addls) + b'\n'))
1034 fp.close()
1039 fp.close()
1035 self.entries = None
1040 self.entries = None
1036 self.addls = set()
1041 self.addls = set()
1037
1042
1038 def addignore(self, fn):
1043 def addignore(self, fn):
1039 self._ignores.add(fn)
1044 self._ignores.add(fn)
1040
1045
1041 def add(self, fn):
1046 def add(self, fn):
1042 if fn in self._ignores:
1047 if fn in self._ignores:
1043 return
1048 return
1044 if self.entries is None:
1049 if self.entries is None:
1045 self._load()
1050 self._load()
1046 if fn not in self.entries:
1051 if fn not in self.entries:
1047 self.addls.add(fn)
1052 self.addls.add(fn)
1048
1053
1049 def remove(self, fn):
1054 def remove(self, fn):
1050 if self.entries is None:
1055 if self.entries is None:
1051 self._load()
1056 self._load()
1052 if fn in self.addls:
1057 if fn in self.addls:
1053 self.addls.remove(fn)
1058 self.addls.remove(fn)
1054 return
1059 return
1055 try:
1060 try:
1056 self.entries.remove(fn)
1061 self.entries.remove(fn)
1057 self._dirty = True
1062 self._dirty = True
1058 except KeyError:
1063 except KeyError:
1059 pass
1064 pass
1060
1065
1061 def __contains__(self, fn):
1066 def __contains__(self, fn):
1062 if fn in self.addls:
1067 if fn in self.addls:
1063 return True
1068 return True
1064 if self.entries is None:
1069 if self.entries is None:
1065 self._load()
1070 self._load()
1066 return fn in self.entries
1071 return fn in self.entries
1067
1072
1068 def __iter__(self):
1073 def __iter__(self):
1069 if self.entries is None:
1074 if self.entries is None:
1070 self._load()
1075 self._load()
1071 return iter(self.entries | self.addls)
1076 return iter(self.entries | self.addls)
1072
1077
1073
1078
1074 class _fncachevfs(vfsmod.proxyvfs):
1079 class _fncachevfs(vfsmod.proxyvfs):
1075 def __init__(self, vfs, fnc, encode):
1080 def __init__(self, vfs, fnc, encode):
1076 vfsmod.proxyvfs.__init__(self, vfs)
1081 vfsmod.proxyvfs.__init__(self, vfs)
1077 self.fncache = fnc
1082 self.fncache = fnc
1078 self.encode = encode
1083 self.encode = encode
1079
1084
1080 def __call__(self, path, mode=b'r', *args, **kw):
1085 def __call__(self, path, mode=b'r', *args, **kw):
1081 encoded = self.encode(path)
1086 encoded = self.encode(path)
1082 if (
1087 if (
1083 mode not in (b'r', b'rb')
1088 mode not in (b'r', b'rb')
1084 and (path.startswith(b'data/') or path.startswith(b'meta/'))
1089 and (path.startswith(b'data/') or path.startswith(b'meta/'))
1085 and revlog_type(path) is not None
1090 and revlog_type(path) is not None
1086 ):
1091 ):
1087 # do not trigger a fncache load when adding a file that already is
1092 # do not trigger a fncache load when adding a file that already is
1088 # known to exist.
1093 # known to exist.
1089 notload = self.fncache.entries is None and self.vfs.exists(encoded)
1094 notload = self.fncache.entries is None and self.vfs.exists(encoded)
1090 if notload and b'r+' in mode and not self.vfs.stat(encoded).st_size:
1095 if notload and b'r+' in mode and not self.vfs.stat(encoded).st_size:
1091 # when appending to an existing file, if the file has size zero,
1096 # when appending to an existing file, if the file has size zero,
1092 # it should be considered as missing. Such zero-size files are
1097 # it should be considered as missing. Such zero-size files are
1093 # the result of truncation when a transaction is aborted.
1098 # the result of truncation when a transaction is aborted.
1094 notload = False
1099 notload = False
1095 if not notload:
1100 if not notload:
1096 self.fncache.add(path)
1101 self.fncache.add(path)
1097 return self.vfs(encoded, mode, *args, **kw)
1102 return self.vfs(encoded, mode, *args, **kw)
1098
1103
1099 def join(self, path):
1104 def join(self, path):
1100 if path:
1105 if path:
1101 return self.vfs.join(self.encode(path))
1106 return self.vfs.join(self.encode(path))
1102 else:
1107 else:
1103 return self.vfs.join(path)
1108 return self.vfs.join(path)
1104
1109
1105 def register_file(self, path):
1110 def register_file(self, path):
1106 """generic hook point to lets fncache steer its stew"""
1111 """generic hook point to lets fncache steer its stew"""
1107 if path.startswith(b'data/') or path.startswith(b'meta/'):
1112 if path.startswith(b'data/') or path.startswith(b'meta/'):
1108 self.fncache.add(path)
1113 self.fncache.add(path)
1109
1114
1110
1115
class fncachestore(basicstore):
    """A store that records every revlog file it creates in an `fncache` file.

    On-disk paths are hybrid-encoded (optionally with dot-encoding) while the
    plain names are kept in the fncache, so tracked files can be enumerated
    without walking the encoded directory tree.
    """

    def __init__(self, path, vfstype, dotencode):
        # pick the on-disk path encoding; dotencode additionally handles
        # problematic leading characters in path components
        if dotencode:
            encode = _pathencode
        else:
            encode = _plainhybridencode
        self.encode = encode
        vfs = vfstype(path + b'/store')
        self.path = vfs.base
        self.pathsep = self.path + b'/'
        self.createmode = _calcmode(vfs)
        vfs.createmode = self.createmode
        self.rawvfs = vfs
        fnc = fncache(vfs)
        self.fncache = fnc
        # writes go through a wrapping vfs that registers new revlog files
        # in the fncache as a side effect
        self.vfs = _fncachevfs(vfs, fnc, encode)
        self.opener = self.vfs

    def join(self, f):
        """Return the absolute, encoded on-disk path for store file ``f``."""
        return self.pathsep + self.encode(f)

    def getsize(self, path):
        """Return the size in bytes of ``path`` (already encoded)."""
        return self.rawvfs.stat(path).st_size

    def data_entries(
        self, matcher=None, undecodable=None
    ) -> Generator[BaseStoreEntry, None, None]:
        """Yield a RevlogStoreEntry for each tracked revlog accepted by
        ``matcher``."""
        files = ((f, revlog_type(f)) for f in self.fncache)
        # Note: all files in fncache should be revlog related, however the
        # fncache might contain such a file added by a previous version of
        # Mercurial.
        files = (f for f in files if f[1] is not None)
        by_revlog = _gather_revlog(files)
        for revlog, details in by_revlog:
            if revlog.startswith(b'data/'):
                rl_type = FILEFLAGS_FILELOG
                revlog_target_id = revlog.split(b'/', 1)[1]
            elif revlog.startswith(b'meta/'):
                rl_type = FILEFLAGS_MANIFESTLOG
                # drop the initial directory and the `00manifest` file part
                tmp = revlog.split(b'/', 1)[1]
                revlog_target_id = tmp.rsplit(b'/', 1)[0] + b'/'
            else:
                # unreachable
                assert False, revlog
            # per-extension detail dicts are empty: the revlog entry itself
            # now determines which of its files are volatile
            file_details = {ext: {} for ext in details}
            entry = RevlogStoreEntry(
                path_prefix=revlog,
                revlog_type=rl_type,
                target_id=revlog_target_id,
                details=file_details,
            )
            if _match_tracked_entry(entry, matcher):
                yield entry

    def copylist(self):
        """Return the list of store files/directories to copy when cloning."""
        d = (
            b'bookmarks',
            b'narrowspec',
            b'data',
            b'meta',
            b'dh',
            b'fncache',
            b'phaseroots',
            b'obsstore',
            b'00manifest.d',
            b'00manifest.i',
            b'00changelog.d',
            b'00changelog.i',
            b'requires',
        )
        return [b'requires', b'00changelog.i'] + [b'store/' + f for f in d]

    def write(self, tr):
        # flush pending fncache additions within transaction ``tr``
        self.fncache.write(tr)

    def invalidatecaches(self):
        # drop the in-memory fncache state so it is reloaded on next access
        self.fncache.entries = None
        self.fncache.addls = set()

    def markremoved(self, fn):
        self.fncache.remove(fn)

    def _exists(self, f):
        """Return True if the (unencoded) store file ``f`` exists on disk."""
        ef = self.encode(f)
        try:
            self.getsize(ef)
            return True
        except FileNotFoundError:
            return False

    def __contains__(self, path):
        '''Checks if the store contains path'''
        path = b"/".join((b"data", path))
        # check for files (exact match)
        e = path + b'.i'
        if e in self.fncache and self._exists(e):
            return True
        # now check for directories (prefix match)
        if not path.endswith(b'/'):
            path += b'/'
        for e in self.fncache:
            if e.startswith(path) and self._exists(e):
                return True
        return False
General Comments 0
You need to be logged in to leave comments. Login now